-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathread_txt.py
More file actions
120 lines (102 loc) · 2.07 KB
/
read_txt.py
File metadata and controls
120 lines (102 loc) · 2.07 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
# Directory prefix and file names of the dataset; the loaders in this file
# open `data_path + train_path` and `data_path + result_path`.
data_path = "./data/"
train_path = "train.txt"
result_path = "test.txt"

# Running extremes of sequence length. These are starting sentinels that the
# module-level scan later in this file tightens as it visits each sequence.
max_len, min_len = 0, 1000

# Not referenced anywhere else in the visible part of this file.
hh = []
def str2int(a):
    """Convert a whitespace-separated string of integers into a list of ints.

    Args:
        a: Text such as ``"12 7 305"``; surrounding whitespace (including a
            trailing newline) and repeated separators are tolerated.

    Returns:
        A list with one ``int`` per token, in input order. Empty or
        whitespace-only input yields an empty list.

    Raises:
        ValueError: If any token is not a valid integer literal.
    """
    # split() without an argument collapses runs of whitespace and ignores
    # leading/trailing whitespace, so doubled or trailing spaces no longer
    # produce an empty token that int() would reject.
    return [int(token) for token in a.split()]
def get_train():
    """Load the training set from ``data_path + train_path``.

    Every non-blank line is split on tab characters; the first three fields
    are each parsed with ``str2int``.

    Returns:
        A tuple ``(texta, textb, labels)`` of three parallel lists. Each
        element is the list of ints parsed from the corresponding field, so
        a label is itself a list (the caller reads ``label[0]``).

    Raises:
        IndexError: If a non-blank line has fewer than three tab-separated
            fields.
        ValueError: If a field contains a token that is not an integer.
    """
    texta = []
    textb = []
    labels = []
    # The context manager closes the file even when parsing raises; the
    # original left the handle open.
    with open(data_path + train_path, "r") as f:
        for line in f:
            # A blank line (typically at end of file) carries no record.
            if not line.strip():
                continue
            fields = line.split("\t")
            texta.append(str2int(fields[0]))
            textb.append(str2int(fields[1]))
            labels.append(str2int(fields[2]))
    return texta, textb, labels
def get_result():
    """Load the unlabeled set from ``data_path + result_path``.

    Every non-blank line is split on tab characters; the first two fields
    are each parsed with ``str2int``.

    Returns:
        A tuple ``(texta, textb)`` of two parallel lists, each element being
        the list of ints parsed from the corresponding field.

    Raises:
        IndexError: If a non-blank line has fewer than two tab-separated
            fields.
        ValueError: If a field contains a token that is not an integer.
    """
    texta = []
    textb = []
    # The context manager closes the file even when parsing raises; the
    # original left the handle open.
    with open(data_path + result_path, "r") as f:
        for line in f:
            # A blank line (typically at end of file) carries no record.
            if not line.strip():
                continue
            fields = line.split("\t")
            texta.append(str2int(fields[0]))
            textb.append(str2int(fields[1]))
    return texta, textb
# Load both datasets once at import time.
texta, textb, labels = get_train()
resulta, resultb = get_result()

# Class balance of the training labels. Each label is a list of ints and only
# its first element is inspected; anything other than 1 counts as "zero".
one = sum(1 for _label in labels if _label[0] == 1)
zero = len(labels) - one

# NOTE: `dict`, `min` and `max` shadow Python builtins. The names are kept
# because they are this module's existing globals; for the same reason the
# extremes are tracked with explicit comparisons instead of calling the
# builtin min()/max(), which stop being callable once rebound here.
dict = set()      # distinct token IDs seen across all four corpora
min = 10000000    # smallest token ID seen so far (starting sentinel)
max = -1          # largest token ID seen so far (starting sentinel)

# One pass over every sequence of every corpus replaces four copies of the
# same loop, and tokens go straight into the set rather than into a large
# intermediate list that is deduplicated afterwards.
for _corpus in (texta, textb, resulta, resultb):
    for _seq in _corpus:
        _length = len(_seq)
        if _length > max_len:
            max_len = _length
        if _length < min_len:
            min_len = _length
        for _token in _seq:
            if _token > max:
                max = _token
            if _token < min:
                min = _token
        dict.update(_seq)
"""
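Debug statements and the values recorded from an earlier run, paired in order
(statement -> printed value):

print(len(dict))  -> 14205   (number of distinct token IDs)
print(max)        -> 51157   (largest token ID)
print(min)        -> 0       (smallest token ID)
print(max_len)    -> 32      (longest sequence length)
print(min_len)    -> 1       (shortest sequence length)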
"""