about summary refs log tree commit diff
path: root/ratspub.py
diff options
context:
space:
mode:
author Hao Chen 2020-03-07 22:34:27 -0600
committer Hao Chen 2020-03-07 22:34:27 -0600
commit ff5c5d3aff13f4f81c9b3e9a39a63e7794cb609e (patch)
tree 0a0910c6733d2e3695960cbbc1e5efc17a3f488c /ratspub.py
parent cea42615bd0c0c02bad574db42fc7c44c5ca5c66 (diff)
download genecup-ff5c5d3aff13f4f81c9b3e9a39a63e7794cb609e.tar.gz
Hakan fixing the count bug
Diffstat (limited to 'ratspub.py')
-rwxr-xr-x ratspub.py 27
1 files changed, 16 insertions, 11 deletions
diff --git a/ratspub.py b/ratspub.py
index 355bc1f..f3effad 100755
--- a/ratspub.py
+++ b/ratspub.py
@@ -56,38 +56,38 @@ def generate_nodes_json(nodes_d, nodetype):
return(nodes_json0)
def generate_edges(data, filename):
- pmid_temp=0
+ pmid_list=[]
json0=str()
edgeCnts={}
for line in data.split("\n"):
if len(line.strip())!=0:
(source, cat, target, pmid, sent) = line.split("\t")
edgeID=filename+"|"+source+"|"+target
- if (edgeID in edgeCnts) and (pmid != pmid_temp):
+ if (edgeID in edgeCnts) and (pmid+target not in pmid_list):
edgeCnts[edgeID]+=1
- pmid_temp = pmid
- elif (edgeID not in edgeCnts):
+ pmid_list.append(pmid+target)
+ elif (edgeID not in edgeCnts) and (pmid+target not in pmid_list):
edgeCnts[edgeID]=1
- pmid_temp = pmid
+ pmid_list.append(pmid+target)
for edgeID in edgeCnts:
(filename, source,target)=edgeID.split("|")
json0+="{ data: { id: '" + edgeID + "', source: '" + source + "', target: '" + target + "', sentCnt: " + str(edgeCnts[edgeID]) + ", url:'/sentences?edgeID=" + edgeID + "' } },\n"
return(json0)
def generate_edges_json(data, filename):
- pmid_temp=0
+ pmid_list=[]
edges_json0=str()
edgeCnts={}
for line in data.split("\n"):
if len(line.strip())!=0:
(source, cat, target, pmid, sent) = line.split("\t")
edgeID=filename+"|"+source+"|"+target
- if (edgeID in edgeCnts) and (pmid != pmid_temp):
+ if (edgeID in edgeCnts) and (pmid+target not in pmid_list):
edgeCnts[edgeID]+=1
- pmid_temp = pmid
- elif (edgeID not in edgeCnts):
+ pmid_list.append(pmid+target)
+ elif (edgeID not in edgeCnts) and (pmid+target not in pmid_list):
edgeCnts[edgeID]=1
- pmid_temp = pmid
+ pmid_list.append(pmid+target)
for edgeID in edgeCnts:
(filename, source,target)=edgeID.split("|")
edges_json0+="{ \"id\": \"" + edgeID + "\", \"source\": \"" + source + "\", \"target\": \"" + target + "\", \"sentCnt\": \"" + str(edgeCnts[edgeID]) + "\", \"url\":\"/sentences?edgeID=" + edgeID + "\" },\n"
@@ -160,10 +160,15 @@ nj4=generate_nodes_json(stress_d, 'stress')
nj5=generate_nodes_json(psychiatric_d, 'psychiatric')
nj6=generate_nodes_json(psychiatric_d, 'GWAS')
+
+pubmed_path="~/Dropbox/ChenLab/Hakan/RatsPub/PubMed/Archive"
+
+'''
host= os.popen('hostname').read().strip()
if host=="x1":
pubmed_path="/run/media/hao/PubMed/Archive/"
elif host=="hchen3":
pubmed_path="/media/hao/2d554499-6c5b-462d-85f3-5c49b25f4ac8/PubMed/Archive"
elif host=="penguin2":
- pubmed_path="/export2/PubMed/Archive"
\ No newline at end of file
+ pubmed_path="/export2/PubMed/Archive"
+'''
\ No newline at end of file