summaryrefslogtreecommitdiff
path: root/rssb_statistics/delete_len_st.py
blob: 010dc84a0cf0284474726d9001885bec44bc844b (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
import os
import re
import csv
import bisect
# Shell pipelines that merge the rotated 2018 logs into single files.  They
# are run through a shell on purpose: they rely on glob expansion, a pipe and
# output redirection.  The strings are fixed constants, never user input.
cmd1 = "cat survey.log.2018* | grep \"recv survey\" > survey.recv_survey.log"
cmd2 = "cat ../12.log/media_expire.log.2018* > ../12.log/media_expire.log"
cmd3 = "cat media_expire.log.2018* > media_expire.log"

# Bucket boundaries for media_len.  The values equal 1, 1.25, 1.5, 1.75, 2, 3
# and 4 times 2**20 (presumably bytes -- confirm against the log producer).
# Seven boundaries produce eight buckets.
breakpoints = [1048576, 1310720, 1572864, 1835008, 2097152, 3145728, 4194304]

# Merged media_expire logs: one under ../12.log, one in the working directory.
mid_12_file = "../12.log/media_expire.log"
mid_13_file = "media_expire.log"

# Field separator for a log line, compiled once instead of once per line.
FIELD_SPLIT = re.compile(r",|MID:|media_len:")
MID_FIELD = 3          # index of the MID value after splitting
MEDIA_LEN_FIELD = 6    # index of the media_len value after splitting
PROGRESS_EVERY = 100000


def run_shell(cmd):
    """Run *cmd* through the shell; warn on stderr if it exits non-zero.

    The script keeps going after a failure, exactly as it did when the exit
    status was ignored, but a failed merge is no longer silent.

    Returns the raw status reported by ``os.system``.
    """
    import sys  # local import: only needed for the warning path

    status = os.system(cmd)
    if status != 0:
        sys.stderr.write(
            "warning: command exited with status %s: %s\n" % (status, cmd))
    return status


def iter_log_fields(path):
    """Yield the split fields of every line in *path*.

    Prints the running line count every PROGRESS_EVERY lines so long runs
    show signs of life.
    """
    with open(path, 'r') as infile:
        for line_no, line in enumerate(infile, 1):
            if line_no % PROGRESS_EVERY == 0:
                print(line_no)
            yield FIELD_SPLIT.split(line)


def load_mids(path):
    """Return the set of integer MIDs that appear in the log at *path*.

    Raises IndexError / ValueError on a line that does not carry a numeric
    MID in the expected field.
    """
    return set(int(fields[MID_FIELD]) for fields in iter_log_fields(path))


def count_deleted_by_len(path, known_mids, bounds):
    """Histogram media_len for lines in *path* whose MID is not in *known_mids*.

    Every matching line is counted, so a MID that occurs on several lines
    contributes once per line.  ``bisect.bisect`` (right bisection) picks the
    bucket, so a length equal to a boundary lands in the bucket above it.

    A MID read from *path* belongs to "MIDs of path minus known_mids" exactly
    when it is missing from *known_mids*, so no separate pass is needed to
    collect the MIDs of *path* first.

    Returns a list of ``len(bounds) + 1`` counters.
    """
    counts = [0] * (len(bounds) + 1)
    for fields in iter_log_fields(path):
        if int(fields[MID_FIELD]) not in known_mids:
            bucket = bisect.bisect(bounds, int(fields[MEDIA_LEN_FIELD]))
            counts[bucket] += 1
    return counts


def main():
    """Merge the rotated logs, then print the media_len histogram.

    The histogram covers entries of mid_12_file whose MID does not occur in
    mid_13_file.
    """
    for cmd in (cmd1, cmd2, cmd3):
        run_shell(cmd)

    mid_13_set = load_mids(mid_13_file)
    st_num = count_deleted_by_len(mid_12_file, mid_13_set, breakpoints)
    print(st_num)
    return st_num


if __name__ == "__main__":
    main()