59 lines
1.4 KiB
Python
59 lines
1.4 KiB
Python
|
#!/usr/bin/env python
|
||
|
import sys
|
||
|
import os
|
||
|
|
||
|
libdir = os.path.join(os.path.dirname(os.path.realpath(__file__)), '../lib')
|
||
|
sys.path.append(libdir)
|
||
|
|
||
|
def main(fname):
|
||
|
with open(fname, 'rt') as f:
|
||
|
text = f.read()
|
||
|
|
||
|
cardstats = text.split('\n')
|
||
|
nonempty = 0
|
||
|
name_avg = 0
|
||
|
name_dupes = 0
|
||
|
card_avg = 0
|
||
|
card_dupes = 0
|
||
|
|
||
|
for c in cardstats:
|
||
|
fields = c.split('|')
|
||
|
if len(fields) < 4:
|
||
|
continue
|
||
|
nonempty += 1
|
||
|
idx = int(fields[0])
|
||
|
name = str(fields[1])
|
||
|
ndist = float(fields[2])
|
||
|
cdist = float(fields[3])
|
||
|
|
||
|
name_avg += ndist
|
||
|
if ndist == 1.0:
|
||
|
name_dupes += 1
|
||
|
card_avg += cdist
|
||
|
if cdist == 1.0:
|
||
|
card_dupes += 1
|
||
|
|
||
|
name_avg = name_avg / float(nonempty)
|
||
|
card_avg = card_avg / float(nonempty)
|
||
|
|
||
|
print str(nonempty) + ' cards'
|
||
|
print '-- names --'
|
||
|
print 'avg distance: ' + str(name_avg)
|
||
|
print 'num duplicates: ' + str(name_dupes)
|
||
|
print '-- cards --'
|
||
|
print 'avg distance: ' + str(card_avg)
|
||
|
print 'num duplicates: ' + str(card_dupes)
|
||
|
print '----'
|
||
|
|
||
|
if __name__ == '__main__':
|
||
|
|
||
|
import argparse
|
||
|
parser = argparse.ArgumentParser()
|
||
|
|
||
|
parser.add_argument('infile', #nargs='?'. default=None,
|
||
|
help='data file to process')
|
||
|
|
||
|
args = parser.parse_args()
|
||
|
main(args.infile)
|
||
|
exit(0)
|