-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathparsing.py
executable file
·100 lines (79 loc) · 1.92 KB
/
parsing.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
import random
# Parse "output.log" into two parallel lists, url_list and size_list, kept in
# descending order of size.  Only lines whose first '|'-separated field is
# "SIZE" are used; field 1 is taken as the URL and field 3 as the size.
#
# The lists start with a ("START", 0) sentinel.  Because it has size 0 and
# always stays last, every entry with a positive size finds a strictly smaller
# element to be inserted in front of.  Entries whose size is <= 0 find no such
# element and are therefore never inserted.
url_list = ["START"]
size_list = [0]

# The context manager closes the log even if a malformed line raises.
with open("output.log") as fobj:
    for line in fobj:
        token = line.split('|')
        if token[0] != "SIZE":
            continue

        curr_url = token[1]
        # The raw text field is what gets stored; consumers call int() on it.
        curr_size = token[3]
        curr_value = int(curr_size)

        # Insert in front of the first strictly smaller entry, so entries with
        # equal sizes keep the order in which they appear in the log.
        for i, existing in enumerate(size_list):
            if int(existing) < curr_value:
                url_list.insert(i, curr_url)
                size_list.insert(i, curr_size)
                # Stop immediately: the lists were just modified, and only
                # one insertion per log line is wanted.
                break
# Split the parsed entries into five size classes.  Each class is a pair of
# parallel lists (urls / sizes) that preserves the order of url_list:
#   A: size > 100000
#   B:  50000 < size <= 100000
#   C:  10000 < size <=  50000
#   D:   1000 < size <=  10000
#   E: size <= 1000
A_size = []
A_url = []
B_size = []
B_url = []
C_size = []
C_url = []
D_size = []
D_url = []
E_size = []
E_url = []

for url, size in zip(url_list, size_list):
    # Convert once per entry instead of once per comparison.
    size_value = int(size)
    if size_value > 100000:
        A_url.append(url)
        A_size.append(size)
    elif size_value > 50000:
        B_url.append(url)
        B_size.append(size)
    elif size_value > 10000:
        C_url.append(url)
        C_size.append(size)
    elif size_value > 1000:
        D_url.append(url)
        D_size.append(size)
    else:
        # NOTE(review): the ("START", 0) sentinel seeded into url_list /
        # size_list also lands here, so E_url can contain "START" - confirm
        # that this is intended.
        E_url.append(url)
        E_size.append(size)
def print_list(pa_list):
    """Print every element of ``pa_list`` on its own line.

    Args:
        pa_list: iterable of values; each one is formatted with ``%s``.
    """
    for item in pa_list:
        # Wrapping the item in a 1-tuple keeps "%s" formatting correct even
        # when the item itself is a tuple.  The single parenthesised argument
        # also makes this line valid on both Python 2 and Python 3.
        print("%s" % (item,))
def print_all(pa_list, pa_size):
    """Print each element of ``pa_list`` next to its size as ``url | size``.

    Args:
        pa_list: sequence of values to print, one per line.
        pa_size: sequence parallel to ``pa_list``; ``pa_size[i]`` is printed
            next to ``pa_list[i]``.

    Raises:
        IndexError: if ``pa_size`` is shorter than ``pa_list``.
    """
    for position, item in enumerate(pa_list):
        # Index pa_size explicitly (rather than zip) so a length mismatch
        # still fails loudly instead of silently truncating the output.
        print("%s | %s" % (item, pa_size[position]))
def print_random(pa_list, pa_size, number):
    """Print up to ``number`` distinct, randomly drawn elements of ``pa_list``.

    ``number`` draws are made with replacement; a draw whose value has already
    been picked is skipped, so fewer than ``number`` lines may be printed.
    The picked values are printed with ``print_list`` in the order drawn.

    Args:
        pa_list: sequence of candidate values.
        pa_size: sizes parallel to ``pa_list``.  Kept for call compatibility;
            the sizes are not part of the printed output.
        number: how many random draws to make.
    """
    # random.randint(0, -1) raises ValueError, so an empty list is a no-op.
    if not pa_list:
        return

    last_index = len(pa_list) - 1
    found_list = []
    for _ in range(number):
        candidate = pa_list[random.randint(0, last_index)]
        # Membership is evaluated afresh for every draw.  The previous
        # implementation used a flag that was never reset, so after the first
        # duplicate draw no further element could ever be added.
        if candidate not in found_list:
            found_list.append(candidate)

    print_list(found_list)
# Number of random draws made for each print_random call.
number = 5

# Output pattern: D C D E D C D E - i.e. the "D, C, D, E" sequence twice.
# The full D list is printed each time, interleaved with random picks from
# the C and E lists.
for _pass in range(2):
    print_list(D_url)
    print_random(C_url, C_size, number)
    print_list(D_url)
    print_random(E_url, E_size, number)