diff options
author | Hao Chen | 2020-03-07 22:34:27 -0600 |
---|---|---|
committer | Hao Chen | 2020-03-07 22:34:27 -0600 |
commit | ff5c5d3aff13f4f81c9b3e9a39a63e7794cb609e (patch) | |
tree | 0a0910c6733d2e3695960cbbc1e5efc17a3f488c /ratspub.py | |
parent | cea42615bd0c0c02bad574db42fc7c44c5ca5c66 (diff) | |
download | genecup-ff5c5d3aff13f4f81c9b3e9a39a63e7794cb609e.tar.gz |
Hakan fixing the count bug
Diffstat (limited to 'ratspub.py')
-rwxr-xr-x | ratspub.py | 27 |
1 files changed, 16 insertions, 11 deletions
@@ -56,38 +56,38 @@ def generate_nodes_json(nodes_d, nodetype):
     return(nodes_json0)
 
 def generate_edges(data, filename):
-    pmid_temp=0
+    pmid_list=[]
     json0=str()
     edgeCnts={}
     for line in data.split("\n"):
         if len(line.strip())!=0:
             (source, cat, target, pmid, sent) = line.split("\t")
             edgeID=filename+"|"+source+"|"+target
-            if (edgeID in edgeCnts) and (pmid != pmid_temp):
+            if (edgeID in edgeCnts) and (pmid+target not in pmid_list):
                 edgeCnts[edgeID]+=1
-                pmid_temp = pmid
-            elif (edgeID not in edgeCnts):
+                pmid_list.append(pmid+target)
+            elif (edgeID not in edgeCnts) and (pmid+target not in pmid_list):
                 edgeCnts[edgeID]=1
-                pmid_temp = pmid
+                pmid_list.append(pmid+target)
     for edgeID in edgeCnts:
         (filename, source,target)=edgeID.split("|")
         json0+="{ data: { id: '" + edgeID + "', source: '" + source + "', target: '" + target + "', sentCnt: " + str(edgeCnts[edgeID]) + ", url:'/sentences?edgeID=" + edgeID + "' } },\n"
     return(json0)
 
 def generate_edges_json(data, filename):
-    pmid_temp=0
+    pmid_list=[]
     edges_json0=str()
     edgeCnts={}
     for line in data.split("\n"):
         if len(line.strip())!=0:
             (source, cat, target, pmid, sent) = line.split("\t")
             edgeID=filename+"|"+source+"|"+target
-            if (edgeID in edgeCnts) and (pmid != pmid_temp):
+            if (edgeID in edgeCnts) and (pmid+target not in pmid_list):
                 edgeCnts[edgeID]+=1
-                pmid_temp = pmid
-            elif (edgeID not in edgeCnts):
+                pmid_list.append(pmid+target)
+            elif (edgeID not in edgeCnts) and (pmid+target not in pmid_list):
                 edgeCnts[edgeID]=1
-                pmid_temp = pmid
+                pmid_list.append(pmid+target)
     for edgeID in edgeCnts:
         (filename, source,target)=edgeID.split("|")
         edges_json0+="{ \"id\": \"" + edgeID + "\", \"source\": \"" + source + "\", \"target\": \"" + target + "\", \"sentCnt\": \"" + str(edgeCnts[edgeID]) + "\", \"url\":\"/sentences?edgeID=" + edgeID + "\" },\n"
@@ -160,10 +160,15 @@ nj4=generate_nodes_json(stress_d, 'stress')
 nj5=generate_nodes_json(psychiatric_d, 'psychiatric')
 nj6=generate_nodes_json(psychiatric_d, 'GWAS')
 
+
+pubmed_path="~/Dropbox/ChenLab/Hakan/RatsPub/PubMed/Archive"
+
+'''
 host= os.popen('hostname').read().strip()
 if host=="x1":
     pubmed_path="/run/media/hao/PubMed/Archive/"
 elif host=="hchen3":
     pubmed_path="/media/hao/2d554499-6c5b-462d-85f3-5c49b25f4ac8/PubMed/Archive"
 elif host=="penguin2":
-    pubmed_path="/export2/PubMed/Archive"
\ No newline at end of file
+    pubmed_path="/export2/PubMed/Archive"
+'''
\ No newline at end of file