aboutsummaryrefslogtreecommitdiff
diff options
context:
space:
mode:
authorPjotr Prins2015-03-12 21:05:51 +0300
committerPjotr Prins2015-03-12 21:05:51 +0300
commitfa4227614042312a54a5d404af4235efc077ab3a (patch)
treef567bc66c6f2eab6aeac9ccd630bdfa275a6618b
parent494edec995a38279eb1da21d520b2cb249eb1079 (diff)
downloadgenenetwork2-fa4227614042312a54a5d404af4235efc077ab3a.tar.gz
lmm: use deep-copy to avoid side-effects
-rw-r--r--wqflask/wqflask/my_pylmm/pyLMM/runlmm.py22
1 files changed, 11 insertions, 11 deletions
diff --git a/wqflask/wqflask/my_pylmm/pyLMM/runlmm.py b/wqflask/wqflask/my_pylmm/pyLMM/runlmm.py
index e64ca0e6..d22e2912 100644
--- a/wqflask/wqflask/my_pylmm/pyLMM/runlmm.py
+++ b/wqflask/wqflask/my_pylmm/pyLMM/runlmm.py
@@ -88,29 +88,28 @@ if options.geno:
g = tsvreader.geno(options.geno)
print g.shape
-def normalizeGenotype(G):
+def normalizeGenotype(g1):
+ g = np.copy(g1) # avoid side effects
# Run for every SNP list (num individuals)
- x = True - np.isnan(G) # Matrix of True/False
- m = G[x].mean() # Global mean value
+ x = True - np.isnan(g) # Matrix of True/False
+ m = g[x].mean() # Global mean value
# print m
- s = np.sqrt(G[x].var()) # Global stddev
+ s = np.sqrt(g[x].var()) # Global stddev
# print s
- G[np.isnan(G)] = m # Plug-in mean values for missing
+ g[np.isnan(g)] = m # Plug-in mean values for missing
if s == 0:
- G = G - m # Subtract the mean
+ g = g - m # Subtract the mean
else:
- G = (G - m) / s # Normalize the deviation
- return G
+ g = (g - m) / s # Normalize the deviation
+ return g
gn = []
for snp in g:
gn.append( normalizeGenotype(snp) )
-gn = g
-
print("Before",g)
-gT = g.T
+gT = np.array(gn).T
print("After",gT)
G = np.array(gT)
print "G shape",G.shape
@@ -129,6 +128,7 @@ if cmd == 'redis':
print G
ps, ts = gn2_load_redis('testrun','other',np.array(k),y,G,options.testing)
print np.array(ps)
+ assert(options.testing and ps[0]==0.726205761108)
elif cmd == 'kinship':
gn = []
for snp in G.T: