-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathenumerate.py
More file actions
62 lines (45 loc) · 1.3 KB
/
enumerate.py
File metadata and controls
62 lines (45 loc) · 1.3 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
import sys
def _parse_records(lines):
    """Split raw comma-separated lines into lists of string fields.

    The line terminator is removed before splitting; otherwise the last
    field of every record would carry a trailing newline and the same value
    would receive a different id depending on which column it appears in.
    Lines that are empty once the terminator is removed are skipped.
    """
    records = []
    for line in lines:
        text = line.rstrip('\n')
        if text:
            records.append(text.split(','))
    return records


def _build_mapping(records):
    """Map each distinct field to an integer id, numbered from 1 in
    first-seen order (row by row, left to right)."""
    mapping = {}
    for fields in records:
        for field in fields:
            # len(mapping) is evaluated before the insert, so a new field
            # receives the next unused id and known fields are left alone.
            mapping.setdefault(field, len(mapping) + 1)
    return mapping


def _write_enumerated(path, rows):
    """Write *rows* to *path* as tab-separated integers.

    The first line holds the number of rows and the number of columns of
    the first row, separated by a tab; every following line is one row.
    """
    with open(path, 'w') as writer:
        writer.write('%d\t%d\n' % (len(rows), len(rows[0])))
        writer.writelines('\t'.join(map(str, row)) + '\n' for row in rows)


def main(argv):
    """Replace every field of a comma-separated file with an integer id.

    argv[1] names the input file. The result is written next to it, to a
    file with the same name plus the suffix '_enum'. The first raw line, its
    type, the first parsed record and the full value-to-id mapping are
    printed to standard output as diagnostics.

    Raises SystemExit when no input file is given or when the file holds
    no records.
    """
    if len(argv) < 2:
        raise SystemExit('usage: enumerate.py <dataset>')
    dataset = argv[1]

    # Read everything up front and release the handle immediately.
    with open(dataset, 'r') as reader:
        lines = reader.readlines()

    records = _parse_records(lines)
    if not records:
        raise SystemExit('%s: no records to enumerate' % dataset)

    print(lines[0])
    print(type(lines[0]))
    print(records[0])

    mapping = _build_mapping(records)
    print('Mapping:', mapping)

    enumerated = [[mapping[field] for field in fields] for fields in records]
    _write_enumerated(dataset + '_enum', enumerated)


if __name__ == '__main__':
    main(sys.argv)