aboutsummaryrefslogtreecommitdiff
path: root/gn3/computations/correlations.py
diff options
context:
space:
mode:
Diffstat (limited to 'gn3/computations/correlations.py')
-rw-r--r--gn3/computations/correlations.py39
1 files changed, 38 insertions, 1 deletions
diff --git a/gn3/computations/correlations.py b/gn3/computations/correlations.py
index fb62b56..90b6c8c 100644
--- a/gn3/computations/correlations.py
+++ b/gn3/computations/correlations.py
@@ -128,7 +128,7 @@ def compute_all_sample_correlation(this_trait,
corr_results = []
processed_values = []
for target_trait in target_dataset:
- # trait_id = target_trait.get("trait_id")
+ # trait_name = target_trait.get("trait_id")
target_trait_data = target_trait["trait_sample_data"]
# this_vals, target_vals = filter_shared_sample_keys(
# this_trait_samples, target_trait_data)
@@ -152,6 +152,43 @@ def compute_all_sample_correlation(this_trait,
return corr_results
+ def benchmark_compute_all_sample(this_trait,
+ target_datasets,
+ corr_method="pearson") ->List:
+ """Temp function to benchmark with compute_all_sample_r
+ """
+
+ this_trait_samples = this_trait["trait_sample_data"]
+
+ corr_results = []
+
+ for target_trait in target_dataset:
+ trait_id = target_trait.get("trait_id")
+ target_trait_data = target_trait["trait_sample_data"]
+ this_vals, target_vals = filter_shared_sample_keys(
+ this_trait_samples, target_trait_data)
+
+ sample_correlation = compute_sample_r_correlation(
+ corr_method=corr_method,
+ trait_vals=this_vals,
+ target_samples_vals=target_vals)
+
+ if sample_correlation is not None:
+ (corr_coeffient, p_value, num_overlap) = sample_correlation
+
+ else:
+ continue
+
+ corr_result = {
+ "corr_coeffient": corr_coeffient,
+ "p_value": p_value,
+ "num_overlap": num_overlap
+ }
+
+ corr_results.append({trait_id: corr_result})
+
+ return corr_results
+
def tissue_lit_corr_for_probe_type(corr_type: str, top_corr_results):
"""Function that does either lit_corr_for_trait_list or tissue_corr _for_trait