aboutsummaryrefslogtreecommitdiff
path: root/wqflask/maintenance/dataset/correlations.py
diff options
context:
space:
mode:
author: Lei Yan, 2014-02-03 12:28:08 -0600
committer: Lei Yan, 2014-02-03 12:28:08 -0600
commit: b462fae9df948dbf35232a764d61fbf10c930e82 (patch)
tree: abadc34dc66b7fdf53adba9b6505ea327ba2a71f /wqflask/maintenance/dataset/correlations.py
parent: c1bd0f562b5249b9a6911e3873dad8dd853aaab7 (diff)
download: genenetwork2-b462fae9df948dbf35232a764d61fbf10c930e82.tar.gz
On branch master
Diffstat (limited to 'wqflask/maintenance/dataset/correlations.py')
-rw-r--r-- wqflask/maintenance/dataset/correlations.py 47
1 files changed, 47 insertions, 0 deletions
diff --git a/wqflask/maintenance/dataset/correlations.py b/wqflask/maintenance/dataset/correlations.py
new file mode 100644
index 00000000..b089e446
--- /dev/null
+++ b/wqflask/maintenance/dataset/correlations.py
@@ -0,0 +1,47 @@
+# Author: Lei Yan
+# Create Date: 2014-01-21
+# Last Update Date: 2014-01-24
+
+# import
+import sys
+import os
+import re
+import MySQLdb
+import ConfigParser
+
+def main(argv):
+    """Load the genotype file named by a configuration file and report its size.
+
+    argv -- argument list laid out like sys.argv; argv[1] is the path of
+            an INI-style configuration file whose [configuration] section
+            has a 'genofile' option holding the genotype file path.
+
+    Genotype file lines that are blank or start with '#' or '@' are
+    skipped.  A line starting with "Chr" is the column header: its fields
+    from the fifth onwards are kept as the strain names.  Every other
+    line becomes one record with the keys 'chr', 'locus', 'cm', 'mb'
+    (the first four whitespace-separated fields) and 'values' (all
+    remaining fields).  A non-blank data line with fewer than four
+    fields raises IndexError.
+
+    Prints the strain count and names, then the number of records.
+    Returns None.
+    """
+    # load configuration from configuration file
+    config = ConfigParser.ConfigParser()
+    config.read(argv[1])
+    genofile = config.get('configuration', 'genofile')
+
+    # parse genofile
+    strains = []  # stays empty when the file has no "Chr" header line
+    genotypes = []
+    # the with-block closes the file even if a line fails to parse
+    with open(genofile, 'r') as file_geno:
+        for line in file_geno:
+            line = line.strip()
+            # a blank line has no fields, so indexing cells[0] would fail
+            if not line or line.startswith(('#', '@')):
+                continue
+            cells = line.split()
+            if line.startswith("Chr"):
+                strains = cells[4:]
+                continue
+            genotypes.append({
+                'chr': cells[0],
+                'locus': cells[1],
+                'cm': cells[2],
+                'mb': cells[3],
+                'values': cells[4:],
+            })
+    # single-argument print(...) emits the same text under Python 2 and 3
+    print("get %d strains:\t%s" % (len(strains), strains))
+    print("load %d genotypes" % len(genotypes))
+
+    # phenotypes (placeholder: no phenotype handling is implemented here)
+
+# Script entry point: run main() on the command-line arguments, then
+# report completion.
+if __name__ == "__main__":
+    main(sys.argv)
+    print("exit successfully")