-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathread_version_json.py
More file actions
55 lines (45 loc) · 1.08 KB
/
read_version_json.py
File metadata and controls
55 lines (45 loc) · 1.08 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
import json
# Reads a JSON list of log entries, collects the distinct values of each
# entry's 'version' field (with "MAPREDUCE" and "HDFS" rewritten to "hadoop"),
# and prints which of those versions are NOT already listed in `folders`.

# Default input file: a JSON array of objects, each carrying a 'version' key.
filename = 'parsed_enhanced_logs.json'

# Version names that are filtered out of the final report.
# NOTE(review): "hadoop-0.23.0" appears twice, so len(folders) counts it
# twice -- confirm whether a different release was meant for one of them.
folders = [
    "cassandra-0.6.5",
    "cassandra-0.7.0-beta1",
    "cassandra-0.8.0-beta1",
    "cassandra-1.0.0-rc2",
    "cassandra-1.2.0",
    "cassandra-2.0.0",
    "hadoop-0.21.0",
    "hadoop-0.22.0",
    "hadoop-0.23.0",
    "hadoop-0.23.0",
    "hadoop-1.2.0",
    "hadoop-2.0.0-alpha",
    "hadoop-2.1.1-beta",
    "hadoop-2.2.0",
    "hadoop-2.3.0",
    "hadoop-2.6.0",
    "hbase-0.90.0",
    "hbase-0.92.0",
    "hbase-0.94.0",
    "hbase-0.95.0",
    "hbase-0.96.1",
    "hbase-0.98.0",
    "zookeeper-3.5.0",
    "zookeeper-3.3.0",
]


def _normalize(version):
    """Return *version* with "MAPREDUCE" and "HDFS" replaced by "hadoop"."""
    return version.replace("MAPREDUCE", "hadoop").replace("HDFS", "hadoop")


def main(path=filename):
    """Print version statistics for the JSON file at *path*.

    Prints, in order: the number of distinct normalized versions, the set
    itself, the size and contents of the sorted list, the number of entries
    in ``folders``, and finally the size and contents of the sorted list
    after every version listed in ``folders`` has been removed.

    Args:
        path: Path to a JSON file containing a list of objects that each
            have a 'version' string.

    Returns:
        The sorted list of normalized versions that are not in ``folders``.

    Raises:
        OSError: If the file cannot be opened.
        json.JSONDecodeError: If the file is not valid JSON.
        KeyError: If an entry has no 'version' key.
    """
    with open(path, encoding="utf-8") as f:
        data = json.load(f)

    versions = {_normalize(entry['version']) for entry in data}
    print(len(versions))
    print(versions)

    version_list = sorted(versions)
    print(len(version_list))
    print(version_list)

    print(len(folders))

    # Build a new list instead of calling remove() on the list being
    # iterated: removing during iteration shifts the remaining items left and
    # silently skips the element that follows each removed one.
    known = frozenset(folders)
    remaining = [version for version in version_list if version not in known]
    print(len(remaining))
    print(remaining)
    return remaining


if __name__ == "__main__":
    main()