lo-ranking/s1.py

#!/usr/bin/env python
# -*- coding:utf-8 -*-
'''
Step 1
'''
from __future__ import print_function
from base import Lo, RAW_DIR, TARGET_DIR
import os
import csv
import sys


# Module-level Lo instance; get_rank_thing() queries it via get_mm_tuple().
los = Lo()


def get_rank_thing(filename, **kwargs):
    '''
    Match every data row of a raw CSV against ``los`` and record the hits.

    Reads ``filename`` from RAW_DIR, skips its first (header) row and, for
    each remaining row, passes columns 1-8 (labelled 'A'..'H') to
    ``los.get_mm_tuple``.  Rows with a non-empty result are written to the
    output CSV in TARGET_DIR as::

        model code, comma-joined result, result size,
        columns 1-8, rank number (column 9), columns 10-33 (24 weights)

    A one-line summary (rows with a match / rows read / total matches) is
    printed when the file has been processed.

    Keyword arguments:
        output -- name of the output file inside TARGET_DIR
                  (default: '<filename>-output.csv').

    Returns a dict mapping each of the nine model codes
    ('I', 'P', 'C', 'M', 'F', 'H', 'S', 'D', 'f') to a dict of
    ``{rank number: set of matched items}``.

    Raises:
        IndexError -- a data row has fewer than 34 columns.
        KeyError   -- column 0 of a matching row is not a known model code.
    '''
    model_count = {
        'I': {}, 'P': {}, 'C': {}, 'M': {}, 'F': {},
        'H': {}, 'S': {}, 'D': {}, 'f': {}
    }
    output_filename = kwargs.get('output', '%s-output.csv' % filename)
    count = tot = lo_match = 0
    # 'wb' is the mode the Python 2 csv writer expects for its output file.
    with open(os.path.join(TARGET_DIR, output_filename), 'wb') as o:
        owriter = csv.writer(o, delimiter=',', quotechar='"',
                             quoting=csv.QUOTE_ALL)
        with open(os.path.join(RAW_DIR, filename)) as f:
            reader = csv.reader(f)
            # Skip the header row.  The default stops an empty input file
            # from raising StopIteration; it simply yields no data rows.
            next(reader, None)
            for r in reader:
                mn, rank_no = r[0], r[9]
                # Indexed access (not slicing) so a short row still fails
                # loudly instead of producing a truncated output row.
                answers = [r[i] for i in range(1, 9)]
                # The 24 per-model weight columns.
                weights = [r[i] for i in range(10, 34)]
                w = answers + [rank_no] + weights
                # (('A', r[1]), ('B', r[2]), ..., ('H', r[8]))
                q = tuple(zip('ABCDEFGH', answers))
                result = los.get_mm_tuple(q)
                tot += 1
                lo_match += len(result)
                if result:
                    count += 1
                    owriter.writerow(
                        [mn, ','.join(list(result)), len(result)] + w)
                    # Accumulate in place; one set per (model, rank) pair.
                    model_count[mn].setdefault(rank_no, set()).update(result)
    print(u'[%s]\n    Count = %s | Total = %s | Lo_w_match = %s' % (
        filename, count, tot, lo_match))
    return model_count


def main(*argv):
    '''
    Build one summary CSV per case file.

    Each case file is run through get_rank_thing() and paired with the
    model codes that belong to it.  The summary, written to
    '<case file>-result.csv' in TARGET_DIR, contains for every rank number
    (in sorted order) a 'rank_no' row followed by one row per model code
    that has matches at that rank; a code without that rank is reported on
    stdout instead.  The file ends with an 'All Result' row and, per model
    code, the union of its matches over all ranks.

    ``argv`` is accepted but not used.
    '''
    case_files = ('Case1_LS.csv', 'Case1_Gender.csv',
                  'Case1_Level.csv', 'Case1_SciF.csv')
    code_groups = ['IPC', 'MF', 'HS', 'fD']
    for case_file, codes in zip(case_files, code_groups):
        mc = get_rank_thing(case_file)
        # Keep only the model codes relevant to this case file.
        per_model = {}
        for code in codes:
            per_model[code] = mc[code]
        # Every rank number seen for any of those codes.
        ranks = set()
        for by_rank in per_model.values():
            ranks.update(by_rank)
        order = sorted(ranks)
        summary_path = os.path.join(TARGET_DIR, '%s-result.csv' % case_file)
        with open(summary_path, 'wb') as out:
            result_writer = csv.writer(out, delimiter=',', quotechar='"',
                                       quoting=csv.QUOTE_ALL)
            combined = {}
            for rank in order:
                result_writer.writerow(['rank_no', rank])
                for code in per_model.keys():
                    try:
                        matched = mc[code][rank]
                    except KeyError:
                        print(' no key ', code, '[', rank, ']')
                    else:
                        if code in combined:
                            combined[code] = combined[code].union(matched)
                        else:
                            combined[code] = matched
                        result_writer.writerow(
                            [code, ','.join(list(matched))])
            result_writer.writerow(['All Result', ''])
            for code in combined.keys():
                result_writer.writerow(
                    [code, ','.join(list(combined[code]))])

if __name__ == '__main__':
    # Unpack the command-line arguments so main(*argv) receives them one by
    # one rather than as a single nested list; with no arguments this is
    # simply main().
    main(*sys.argv[1:])
First commit 11 years ago			`#!/usr/bin/env python`
s7 add yynn_count 10 years ago			`# -- coding:utf-8 --`
			`'''`
			`Step 1`
			`'''`
First commit 11 years ago			`from __future__ import print_function`
[july] s1 with all 24 weight values 10 years ago			`from base import Lo, RAW_DIR, TARGET_DIR`
Update step 1 completed 11 years ago			`import os`
			`import csv`
			`import sys`
First commit 11 years ago

			`los = Lo()`

Update step 1 completed 11 years ago
			`def get_rank_thing(filename, **kwargs):`
			`model_count = {`
			`'I': {}, 'P': {}, 'C': {}, 'M': {}, 'F': {},`
Part 2 should be completed 11 years ago			`'H': {}, 'S': {}, 'D': {}, 'f': {}`
Update step 1 completed 11 years ago			`}`
			`output_filename = kwargs.get('output', '%s-output.csv' % filename)`
First commit 11 years ago			`count = tot = lo_match = 0`
[july] s1 with all 24 weight values 10 years ago			`with open(os.path.join(TARGET_DIR, output_filename), 'wb') as o:`
Update step 1 completed 11 years ago			`owriter = csv.writer(o, delimiter=',', quotechar='"',`
			`quoting=csv.QUOTE_ALL)`
[july] s1 with all 24 weight values 10 years ago			`with open(os.path.join(RAW_DIR, filename)) as f:`
Update step 1 completed 11 years ago			`reader = csv.reader(f)`
			`reader.next()`
			`for r in reader:`
Update algorithm by request 11 years ago			`mn, rank_no = r[0], r[9]`
July 1 requested 11 years ago			`w = [`
			`r[1], r[2], r[3], r[4], r[5], r[6], r[7], r[8], # July 1`
			`rank_no, # July 1`
			`]`
[july] s1 with all 24 weight values 10 years ago			`## add 24 model's weight`
			`for i in xrange(10, 34):`
			`w.append(r[i])`
Update step 1 completed 11 years ago			`q = (`
			`('A', r[1]), ('B', r[2]), ('C', r[3]), ('D', r[4]),`
			`('E', r[5]), ('F', r[6]), ('G', r[7]), ('H', r[8]),`
			`)`
			`result = los.get_mm_tuple(q)`
			`tot += 1`
			`lo_match += len(result)`
			`if result:`
			`# print(u'%s > %s' % (r[0], list(result)))`
			`count += 1`
July 1 requested 11 years ago			`owriter.writerow([`
			`mn,`
			`','.join(list(result)),`
			`len(result),`
			`# rank_no`
			`] + w)`
Update algorithm by request 11 years ago			`if rank_no not in model_count[mn]:`
			`model_count[mn][rank_no] = set()`
			`model_count[mn][rank_no] = model_count[mn][rank_no].union(result)`
First commit 11 years ago			`print(u'[%s]\n Count = %s \| Total = %s \| Lo_w_match = %s' % (`
Update step 1 completed 11 years ago			`filename, count, tot, lo_match))`
			`return model_count`
First commit 11 years ago

Update step 1 completed 11 years ago			`def main(*argv):`
			`fs = ('Case1_LS.csv', 'Case1_Gender.csv',`
			`'Case1_Level.csv', 'Case1_SciF.csv')`
typo 11 years ago			`result = ['IPC', 'MF', 'HS', 'fD']`
Update step 1 completed 11 years ago			`for f in xrange(0, len(fs)):`
			`mc = get_rank_thing(fs[f])`
			`x = {}`
			`for i in result[f]:`
			`x[i] = mc[i]`
			`# print('x: ', x)`
			`mx = [set(j) for i, j in x.items()]`
Update algorithm by request 11 years ago			`order = sorted(list(set.union(*mx)))`
Update step 1 completed 11 years ago			`sum_file = '%s-result.csv' % fs[f]`
[july] s1 with all 24 weight values 10 years ago			`with open(os.path.join(TARGET_DIR, sum_file), 'wb') as o:`
Update step 1 completed 11 years ago			`result_writer = csv.writer(o, delimiter=',', quotechar='"',`
			`quoting=csv.QUOTE_ALL)`
Add missing all result 11 years ago			`m = {}`
This should fix misunderstanding I have previously There is no more limit in rank since max is #4 anyway 11 years ago			`# print(j, ':', order)`
			`for i in xrange(0, len(order)):`
Update algorithm by request 11 years ago			`result_writer.writerow(['rank_no', order[i]])`
Update step 1 completed 11 years ago			`# print('count , ', order[i], ' / ', type(order[i]))`
			`for j in x.keys():`
			`try:`
			`# print(j, ', ', s)`
			`lo_result = mc[j][order[i]]`
			`# print(order[i], ' == ', len(lo_result))`
This should fix misunderstanding I have previously There is no more limit in rank since max is #4 anyway 11 years ago			`# if i == 2 and len(mc[j]) > 3:`
			`# for _i in xrange(3, len(mc[j])):`
			`# lo_result = lo_result.union(mc[j][order[_i]])`
			`# # print(' ==EX== ', len(lo_result))`
Add missing all result 11 years ago			`if j not in m:`
			`m[j] = lo_result`
			`else:`
			`m[j] = m[j].union(lo_result)`
Update step 1 completed 11 years ago			`result_writer.writerow([j, ','.join(list(lo_result))])`
			`except KeyError:`
			`print(' no key ', j, '[', order[i], ']')`
Add missing all result 11 years ago			`result_writer.writerow(['All Result', ''])`
			`for _m in m.keys():`
			`result_writer.writerow([_m, ','.join(list(m[_m]))])`
First commit 11 years ago
			`if __name__ == '__main__':`
Update step 1 completed 11 years ago			`if len(sys.argv) > 1:`
			`main(sys.argv[1:])`
			`else:`
			`main()`