-
Notifications
You must be signed in to change notification settings - Fork 3
/
Copy pathstatistics.py
62 lines (57 loc) · 2.04 KB
/
statistics.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
import argparse
def get_args():
"""Parse command line."""
parser = argparse.ArgumentParser()
parser.add_argument("--input", help="input txt file", required=True)
parser.add_argument("--output", help="output csv file", required=True)
args = parser.parse_args()
return args
def statistics(INPUT_FILE, OUTPUT_FILE):
# collect values
values=[]
with open(INPUT_FILE, 'r') as input_file:
line = input_file.readline()
while line:
pairs = line.strip().split(',')
if len(pairs)>=2:
values.append(pairs[0])
values.append(pairs[1])
line = input_file.readline()
# unique
values=list(set(values))
# statistics
# statistics_data={}
intervals = [[ 50, 100, 0]
,[ 100, 200, 0]
,[ 200, 300, 0]
,[ 300, 400, 0]
,[ 400, 500, 0]
,[ 500, 1000, 0]
,[1000, 2000, 0]
,[2000, 6000, 0]
,[6000, float('inf'), 0]
]
for index, value in enumerate(values):
size=len(value)
# if not statistics_data.has_key(size):
# statistics_data[size]=1
# else:
# statistics_data[size]=statistics_data[size]+1
for index, interval in enumerate(intervals):
start, end, count = interval
if start<=size and size<end:
intervals[index][2] = count+1
# write to output_file
# with open(OUTPUT_FILE, 'w') as output_file:
# for size, count in statistics_data.items():
# line=str(size)+','+str(count)
# output_file.write(line+'\n')
with open(OUTPUT_FILE, 'w') as output_file:
for index, interval in enumerate(intervals):
start, end, count = interval
line=str(start)+','+str(count)
output_file.write(line+'\n')
if __name__=="__main__":
"""main."""
args = get_args()
statistics(args.input, args.output)