This repository has been archived by the owner on Oct 22, 2021. It is now read-only.
-
Notifications
You must be signed in to change notification settings - Fork 2
/
Copy pathcircle-packing-for-all.py
85 lines (73 loc) · 3.52 KB
/
circle-packing-for-all.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
#!/usr/bin/env python2.7
#
# Licensed to the Apache Software Foundation (ASF) under one or more
# contributor license agreements. See the NOTICE file distributed with
# this work for additional information regarding copyright ownership.
# The ASF licenses this file to You under the Apache License, Version 2.0
# (the "License"); you may not use this file except in compliance with
# the License. You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#
#
import json
import argparse
import csv
import sys
def createCluster(inputCSV,argNum):
row=[]
if(argNum not in [0,1,2]):
print("Input Error! \nPass argument to --cluster as one of the following\n0 for clustering based on x-coordinate, \n1 for clustering based on y-coordinate, \n2 for clustering based on similarity score")
sys.exit()
csvPath = inputCSV #Input Path to csv file
with open(csvPath,"r") as f:
lines = [line.strip() for line in f]
standard = lines[1].split(",")[0]
row.append("{0},{0},1".format(standard))
for line in lines:
if not "x-coordinate" in line.split(","):
if standard in line.split(","):
line_split = line.split(",")
line_split[2] = str(round(float(line_split[2]), 2))
line = ",".join(line_split)
row.append(line)
data={}
for i in range(len(row)):
if "x-coordinate" in row[i].split(","):
continue
else:
column = row[i].split(",")
data[column[argNum]]=[] #Cluster based on the argument number passed
for i in range(len(row)):
if "x-coordinate" in row[i].split(","):
continue
else:
column = row[i].split(",")
second={}
second["name"]=column[1].split('/')[-1]+' '+column[2]
second["size"]=column[2]
data[column[argNum]].append(second) #Cluster based on the argument number passed
clusterList = []
i=0
for elem in list(data.keys()):
first={}
first["name"]="Similarity: "+row[i].split(",")[2]
first["children"]=data[elem]
clusterList.append(first)
i+=1
print(json.dumps(clusterList, sort_keys=True, indent=4, separators=(',', ': ')))
clusterStruct = {"name":"clusters", "children":clusterList}
with open("circle.json", "w") as f: #Pass the json file as input to circle-packing.html
f.write(json.dumps(clusterStruct, sort_keys=True, indent=4, separators=(',', ': ')))
if __name__ == '__main__':
argParser = argparse.ArgumentParser('Edit/Cosine/Jaccard JSON Similarity Circle Packing')
argParser.add_argument('--inputCSV', required=True, help='path to directory containing CSV File, containing pair-wise similarity scores based on edit/cosine similarity distance')
argParser.add_argument('--cluster', required=True, type=int, help='Cluster based on the x-coordinate/y-coordinate/similarity score. Pass 0 for clustering based on x-coordinate, 1 for clustering based on y-coordinate, 2 for clustering based on similarity score')
args = argParser.parse_args()
createCluster(args.inputCSV, args.cluster)