1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
|
import os
import re
import csv
import bisect
# Shell pipelines that merge the per-period "*.2018*" logs into single files.
# They are run through a shell because they rely on globbing, a pipe and
# output redirection.  Note that cmd1's output (survey.recv_survey.log) is
# produced here but not read back by this script.
cmd1 = "cat survey.log.2018* | grep \"recv survey\" > survey.recv_survey.log"
cmd2 = "cat ../12.log/media_expire.log.2018* > ../12.log/media_expire.log"
cmd3 = "cat media_expire.log.2018* > media_expire.log"

# Ascending bucket boundaries for media_len: 1, 1.25, 1.5, 1.75, 2, 3 and 4
# times 2**20 (presumably bytes -- confirm against the log producer).
breakpoints = [1048576, 1310720, 1572864, 1835008, 2097152, 3145728, 4194304]

mid_12_file = "../12.log/media_expire.log"
mid_13_file = "media_expire.log"

# Compiled once instead of being looked up for every log line.
FIELD_SEPARATOR = re.compile(r",|MID:|media_len:")
# Positions, within the split result, of the values this script reads.
MID_FIELD = 3
MEDIA_LEN_FIELD = 6
# A progress counter is printed every this many lines.
PROGRESS_EVERY = 100000


def split_fields(line):
    """Split one log line on ',', 'MID:' or 'media_len:' and return the pieces."""
    return FIELD_SEPARATOR.split(line)


def iter_with_progress(lines, every=PROGRESS_EVERY):
    """Yield each item of *lines*, printing the running count every *every* items.

    The count is printed before the corresponding line is handed to the
    caller, matching the order of the original inline loops.
    """
    for count, line in enumerate(lines, 1):
        if count % every == 0:
            # Single-argument print(...) behaves the same on Python 2 and 3.
            print(count)
        yield line


def collect_mids(lines):
    """Return the set of integer MIDs (split field 3) found in *lines*.

    Raises IndexError / ValueError if a line has too few fields or a
    non-numeric MID, exactly as the unguarded parsing always did.
    """
    return set(
        int(split_fields(line)[MID_FIELD]) for line in iter_with_progress(lines)
    )


def bucket_sizes(lines, wanted_mids):
    """Count lines whose MID is in *wanted_mids*, bucketed by media_len.

    Returns a list with ``len(breakpoints) + 1`` counters; entry ``j`` counts
    the matching lines whose media_len (split field 6) satisfies
    ``bisect.bisect(breakpoints, media_len) == j``.  A value equal to a
    breakpoint therefore lands in the bucket above it.  Every matching line
    is counted, so a MID that appears on several lines contributes several
    times.
    """
    counts = [0] * (len(breakpoints) + 1)
    for line in iter_with_progress(lines):
        fields = split_fields(line)
        # media_len is only parsed for matching lines, so a malformed size on
        # a non-matching line is still tolerated.
        if int(fields[MID_FIELD]) in wanted_mids:
            bucket = bisect.bisect(breakpoints, int(fields[MEDIA_LEN_FIELD]))
            counts[bucket] += 1
    return counts


def main():
    """Merge the logs, then print the media_len histogram of MIDs only in 12.log.

    Steps: run the three shell merge commands, collect the MIDs present in
    each merged media_expire.log, and re-scan the 12.log file to bucket the
    media_len of every line whose MID does not occur in the local file.
    """
    # Exit statuses are not checked, as before.
    for command in (cmd1, cmd2, cmd3):
        os.system(command)

    with open(mid_13_file, 'r') as infile:
        mid_13_set = collect_mids(infile)
    with open(mid_12_file, 'r') as infile:
        mid_12_set = collect_mids(infile)

    different = mid_12_set.difference(mid_13_set)

    # Second pass over the 12.log file: only MIDs are kept in memory, so the
    # sizes have to be re-read from disk.
    with open(mid_12_file, 'r') as infile:
        st_num = bucket_sizes(infile, different)
    print(st_num)


if __name__ == "__main__":
    main()
|