aboutsummaryrefslogtreecommitdiff
path: root/gn3
diff options
context:
space:
mode:
Diffstat (limited to 'gn3')
-rw-r--r--gn3/api/gemma.py402
-rw-r--r--gn3/computations/gemma.py7
2 files changed, 213 insertions, 196 deletions
diff --git a/gn3/api/gemma.py b/gn3/api/gemma.py
index a341f62..d82f5a5 100644
--- a/gn3/api/gemma.py
+++ b/gn3/api/gemma.py
@@ -24,8 +24,7 @@ gemma = Blueprint("gemma", __name__)
def get_version():
"""Display the installed version of gemma-wrapper"""
gemma_cmd = current_app.config["GEMMA_WRAPPER_CMD"]
- return jsonify(
- run_cmd(f"{gemma_cmd} -v | head -n 1"))
+ return jsonify(run_cmd(f"{gemma_cmd} -v | head -n 1"))
# This is basically extracted from genenetwork2
@@ -39,19 +38,21 @@ file output is returned.
"""
data = request.get_json()
app_defaults = current_app.config
- __hash = generate_hash_of_string(
- f"{data.get('genofile_name')}_"
- ''.join(data.get("values", "")))
+ __hash = generate_hash_of_string(f"{data.get('genofile_name')}_"
+ ''.join(data.get("values", "")))
gemma_kwargs = {
- "geno_filename": os.path.join(app_defaults.get("GENODIR"), "bimbam",
- f"{data.get('geno_filename')}"),
- "trait_filename": generate_pheno_txt_file(
+ "geno_filename":
+ os.path.join(app_defaults.get("GENODIR"), "bimbam",
+ f"{data.get('geno_filename')}"),
+ "trait_filename":
+ generate_pheno_txt_file(
tmpdir=app_defaults.get("TMPDIR"),
values=data.get("values"),
# Generate this file on the fly!
trait_filename=(f"{data.get('dataset_groupname')}_"
f"{data.get('trait_name')}_"
- f"{__hash}.txt"))}
+ f"{__hash}.txt"))
+ }
gemma_wrapper_kwargs = {}
if data.get("loco"):
gemma_wrapper_kwargs["loco"] = f"--input {data.get('loco')}"
@@ -74,14 +75,14 @@ file output is returned.
if not all([k_computation_cmd, gwa_cmd]):
return jsonify(status=128,
error="Unable to generate cmds for computation!"), 500
- return jsonify(
- unique_id=queue_cmd(conn=redis.Redis(),
- email=data.get("email"),
- job_queue=app_defaults.get("REDIS_JOB_QUEUE"),
- cmd=f"{k_computation_cmd} && {gwa_cmd}"),
- status="queued",
- output_file=(f"{data.get('dataset_name')}_GWA_"
- f"{__hash}.txt"))
+ return jsonify(unique_id=queue_cmd(
+ conn=redis.Redis(),
+ email=data.get("email"),
+ job_queue=app_defaults.get("REDIS_JOB_QUEUE"),
+ cmd=f"{k_computation_cmd} && {gwa_cmd}"),
+ status="queued",
+ output_file=(f"{data.get('dataset_name')}_GWA_"
+ f"{__hash}.txt"))
@gemma.route("/status/<unique_id>", methods=["GET"])
@@ -90,8 +91,7 @@ def check_cmd_status(unique_id):
gemma endpoints, return the status of the command
"""
- status = redis.Redis().hget(name=unique_id,
- key="status")
+ status = redis.Redis().hget(name=unique_id, key="status")
if not status:
return jsonify(status=128,
error="The unique id you used does not exist!"), 500
@@ -105,39 +105,40 @@ and return <hash-of-inputs>.json with a UNIQUE-ID of the job. The genofile,
traitfile, and snpsfile are extracted from a metadata.json file.
"""
- working_dir = os.path.join(current_app.config.get("TMPDIR"),
- token)
- _dict = jsonfile_to_dict(os.path.join(working_dir,
- "metadata.json"))
+ working_dir = os.path.join(current_app.config.get("TMPDIR"), token)
+ _dict = jsonfile_to_dict(os.path.join(working_dir, "metadata.json"))
try:
- genofile, phenofile, snpsfile = [os.path.join(working_dir,
- _dict.get(x))
- for x in ["geno", "pheno", "snps"]]
+ genofile, phenofile, snpsfile = [
+ os.path.join(working_dir, _dict.get(x))
+ for x in ["geno", "pheno", "snps"]
+ ]
if not do_paths_exist([genofile, phenofile, snpsfile]):
raise FileNotFoundError
gemma_kwargs = {"g": genofile, "p": phenofile, "a": snpsfile}
_hash = get_hash_of_files([genofile, phenofile, snpsfile])
k_output_filename = f"{_hash}-k-output.json"
- return jsonify(
- unique_id=queue_cmd(
- conn=redis.Redis(),
- email=(request.get_json() or {}).get('email'),
- job_queue=current_app.config.get("REDIS_JOB_QUEUE"),
- cmd=compose_gemma_cmd(
- gemma_wrapper_cmd=current_app.config.get("GEMMA_"
- "WRAPPER_CMD"),
- gemma_wrapper_kwargs=None,
- gemma_kwargs=gemma_kwargs,
- gemma_args=["-gk", ">",
- (f"{current_app.config.get('TMPDIR')}/"
- f"{token}/{k_output_filename}")])),
- status="queued",
- output_file=k_output_filename)
+ return jsonify(unique_id=queue_cmd(
+ conn=redis.Redis(),
+ email=(request.get_json() or {}).get('email'),
+ job_queue=current_app.config.get("REDIS_JOB_QUEUE"),
+ cmd=compose_gemma_cmd(gemma_wrapper_cmd=current_app.config.get(
+ "GEMMA_"
+ "WRAPPER_CMD"),
+ gemma_wrapper_kwargs=None,
+ gemma_kwargs=gemma_kwargs,
+ gemma_args=[
+ "-gk", ">",
+ (f"{current_app.config.get('TMPDIR')}/"
+ f"{token}/{k_output_filename}")
+ ])),
+ status="queued",
+ output_file=k_output_filename)
# pylint: disable=W0703
except Exception:
- return jsonify(status=128,
- # use better message
- message="Metadata file non-existent!")
+ return jsonify(
+ status=128,
+ # use better message
+ message="Metadata file non-existent!")
@gemma.route("/k-compute/loco/<chromosomes>/<token>", methods=["POST"])
@@ -146,39 +147,40 @@ def compute_k_loco(chromosomes, token):
values.
"""
- working_dir = os.path.join(current_app.config.get("TMPDIR"),
- token)
- _dict = jsonfile_to_dict(os.path.join(working_dir,
- "metadata.json"))
+ working_dir = os.path.join(current_app.config.get("TMPDIR"), token)
+ _dict = jsonfile_to_dict(os.path.join(working_dir, "metadata.json"))
try:
- genofile, phenofile, snpsfile = [os.path.join(working_dir,
- _dict.get(x))
- for x in ["geno", "pheno", "snps"]]
+ genofile, phenofile, snpsfile = [
+ os.path.join(working_dir, _dict.get(x))
+ for x in ["geno", "pheno", "snps"]
+ ]
if not do_paths_exist([genofile, phenofile, snpsfile]):
raise FileNotFoundError
gemma_kwargs = {"g": genofile, "p": phenofile, "a": snpsfile}
_hash = get_hash_of_files([genofile, phenofile, snpsfile])
k_output_filename = f"{_hash}-k-output.json"
- return jsonify(
- unique_id=queue_cmd(
- conn=redis.Redis(),
- email=(request.get_json() or {}).get('email'),
- job_queue=current_app.config.get("REDIS_JOB_QUEUE"),
- cmd=compose_gemma_cmd(
- gemma_wrapper_cmd=current_app.config.get("GEMMA_"
- "WRAPPER_CMD"),
- gemma_wrapper_kwargs={"loco": f"--input {chromosomes}"},
- gemma_kwargs=gemma_kwargs,
- gemma_args=["-gk", ">",
- (f"{current_app.config.get('TMPDIR')}/"
- f"{token}/{k_output_filename}")])),
- status="queued",
- output_file=k_output_filename)
+ return jsonify(unique_id=queue_cmd(
+ conn=redis.Redis(),
+ email=(request.get_json() or {}).get('email'),
+ job_queue=current_app.config.get("REDIS_JOB_QUEUE"),
+ cmd=compose_gemma_cmd(
+ gemma_wrapper_cmd=current_app.config.get("GEMMA_"
+ "WRAPPER_CMD"),
+ gemma_wrapper_kwargs={"loco": f"--input {chromosomes}"},
+ gemma_kwargs=gemma_kwargs,
+ gemma_args=[
+ "-gk", ">",
+ (f"{current_app.config.get('TMPDIR')}/"
+ f"{token}/{k_output_filename}")
+ ])),
+ status="queued",
+ output_file=k_output_filename)
# pylint: disable=W0703
except Exception:
- return jsonify(status=128,
- # use better message
- message="Metadata file non-existent!")
+ return jsonify(
+ status=128,
+ # use better message
+ message="Metadata file non-existent!")
@gemma.route("/gwa-compute/<k_filename>/<token>", methods=["POST"])
@@ -186,41 +188,46 @@ def compute_gwa(k_filename, token):
"""Compute GWA values. No loco no covariates provided.
"""
- working_dir = os.path.join(current_app.config.get("TMPDIR"),
- token)
- _dict = jsonfile_to_dict(os.path.join(working_dir,
- "metadata.json"))
+ working_dir = os.path.join(current_app.config.get("TMPDIR"), token)
+ _dict = jsonfile_to_dict(os.path.join(working_dir, "metadata.json"))
try:
genofile, phenofile, snpsfile = [
- os.path.join(working_dir,
- _dict.get(x))
- for x in ["geno", "pheno", "snps"]]
- gemma_kwargs = {"g": genofile, "p": phenofile,
- "a": snpsfile, "lmm": _dict.get("lmm", 9)}
+ os.path.join(working_dir, _dict.get(x))
+ for x in ["geno", "pheno", "snps"]
+ ]
+ gemma_kwargs = {
+ "g": genofile,
+ "p": phenofile,
+ "a": snpsfile,
+ "lmm": _dict.get("lmm", 9)
+ }
_hash = get_hash_of_files([genofile, phenofile, snpsfile])
_output_filename = f"{_hash}-gwa-output.json"
- return jsonify(
- unique_id=queue_cmd(
- conn=redis.Redis(),
- email=(request.get_json() or {}).get('email'),
- job_queue=current_app.config.get("REDIS_JOB_QUEUE"),
- cmd=compose_gemma_cmd(
- gemma_wrapper_cmd=current_app.config.get("GEMMA_"
- "WRAPPER_CMD"),
- gemma_wrapper_kwargs={
- "input": os.path.join(working_dir, k_filename)
- },
- gemma_kwargs=gemma_kwargs,
- gemma_args=["gk", ">",
- (f"{current_app.config.get('TMPDIR')}/"
- f"{token}/{_output_filename}")])),
- status="queued",
- output_file=_output_filename)
+ return jsonify(unique_id=queue_cmd(
+ conn=redis.Redis(),
+ email=(request.get_json() or {}).get('email'),
+ job_queue=current_app.config.get("REDIS_JOB_QUEUE"),
+ cmd=compose_gemma_cmd(gemma_wrapper_cmd=current_app.config.get(
+ "GEMMA_"
+ "WRAPPER_CMD"),
+ gemma_wrapper_kwargs={
+ "input":
+ os.path.join(working_dir, k_filename)
+ },
+ gemma_kwargs=gemma_kwargs,
+ gemma_args=[
+ "gk", ">",
+ (f"{current_app.config.get('TMPDIR')}/"
+ f"{token}/{_output_filename}")
+ ])),
+ status="queued",
+ output_file=_output_filename)
# pylint: disable=W0703
except Exception:
- return jsonify(status=128,
- # use better message
- message="Metadata file non-existent!")
+ return jsonify(
+ status=128,
+ # use better message
+ message="Metadata file non-existent!")
@gemma.route("/gwa-compute/covars/<k_filename>/<token>", methods=["POST"])
@@ -228,42 +235,47 @@ def compute_gwa_with_covar(k_filename, token):
"""Compute GWA values. Covariates provided.
"""
- working_dir = os.path.join(current_app.config.get("TMPDIR"),
- token)
- _dict = jsonfile_to_dict(os.path.join(working_dir,
- "metadata.json"))
+ working_dir = os.path.join(current_app.config.get("TMPDIR"), token)
+ _dict = jsonfile_to_dict(os.path.join(working_dir, "metadata.json"))
try:
genofile, phenofile, snpsfile, covarfile = [
- os.path.join(working_dir,
- _dict.get(x))
- for x in ["geno", "pheno", "snps", "covar"]]
- gemma_kwargs = {"g": genofile, "p": phenofile,
- "a": snpsfile, "c": covarfile,
- "lmm": _dict.get("lmm", 9)}
+ os.path.join(working_dir, _dict.get(x))
+ for x in ["geno", "pheno", "snps", "covar"]
+ ]
+ gemma_kwargs = {
+ "g": genofile,
+ "p": phenofile,
+ "a": snpsfile,
+ "c": covarfile,
+ "lmm": _dict.get("lmm", 9)
+ }
_hash = get_hash_of_files([genofile, phenofile, snpsfile, covarfile])
_output_filename = f"{_hash}-gwa-output.json"
- return jsonify(
- unique_id=queue_cmd(
- conn=redis.Redis(),
- email=(request.get_json() or {}).get('email'),
- job_queue=current_app.config.get("REDIS_JOB_QUEUE"),
- cmd=compose_gemma_cmd(
- gemma_wrapper_cmd=current_app.config.get("GEMMA_"
- "WRAPPER_CMD"),
- gemma_wrapper_kwargs={
- "input": os.path.join(working_dir, k_filename)
- },
- gemma_kwargs=gemma_kwargs,
- gemma_args=["-gk", ">",
- (f"{current_app.config.get('TMPDIR')}/"
- f"{token}/{_output_filename}")])),
- status="queued",
- output_file=_output_filename)
+ return jsonify(unique_id=queue_cmd(
+ conn=redis.Redis(),
+ email=(request.get_json() or {}).get('email'),
+ job_queue=current_app.config.get("REDIS_JOB_QUEUE"),
+ cmd=compose_gemma_cmd(gemma_wrapper_cmd=current_app.config.get(
+ "GEMMA_"
+ "WRAPPER_CMD"),
+ gemma_wrapper_kwargs={
+ "input":
+ os.path.join(working_dir, k_filename)
+ },
+ gemma_kwargs=gemma_kwargs,
+ gemma_args=[
+ "-gk", ">",
+ (f"{current_app.config.get('TMPDIR')}/"
+ f"{token}/{_output_filename}")
+ ])),
+ status="queued",
+ output_file=_output_filename)
# pylint: disable=W0703
except Exception:
- return jsonify(status=128,
- # use better message
- message="Metadata file non-existent!")
+ return jsonify(
+ status=128,
+ # use better message
+ message="Metadata file non-existent!")
@gemma.route("/gwa-compute/<k_filename>/loco/maf/<maf>/<token>",
@@ -272,45 +284,49 @@ def compute_gwa_with_loco_maf(k_filename, maf, token):
"""Compute GWA values. No Covariates provided. Only loco and maf vals given.
"""
- working_dir = os.path.join(current_app.config.get("TMPDIR"),
- token)
- _dict = jsonfile_to_dict(os.path.join(working_dir,
- "metadata.json"))
+ working_dir = os.path.join(current_app.config.get("TMPDIR"), token)
+ _dict = jsonfile_to_dict(os.path.join(working_dir, "metadata.json"))
try:
genofile, phenofile, snpsfile = [
- os.path.join(working_dir,
- _dict.get(x))
- for x in ["geno", "pheno", "snps"]]
+ os.path.join(working_dir, _dict.get(x))
+ for x in ["geno", "pheno", "snps"]
+ ]
if not do_paths_exist([genofile, phenofile, snpsfile]):
raise FileNotFoundError
- gemma_kwargs = {"g": genofile, "p": phenofile,
- "a": snpsfile, "lmm": _dict.get("lmm", 9),
- 'maf': float(maf)}
+ gemma_kwargs = {
+ "g": genofile,
+ "p": phenofile,
+ "a": snpsfile,
+ "lmm": _dict.get("lmm", 9),
+ 'maf': float(maf)
+ }
_hash = get_hash_of_files([genofile, phenofile, snpsfile])
_output_filename = f"{_hash}-gwa-output.json"
- return jsonify(
- unique_id=queue_cmd(
- conn=redis.Redis(),
- email=(request.get_json() or {}).get('email'),
- job_queue=current_app.config.get("REDIS_JOB_QUEUE"),
- cmd=compose_gemma_cmd(
- gemma_wrapper_cmd=current_app.config.get("GEMMA_"
- "WRAPPER_CMD"),
- gemma_wrapper_kwargs={
- "loco": ("--input "
- f"{os.path.join(working_dir, k_filename)}")
- },
- gemma_kwargs=gemma_kwargs,
- gemma_args=["-gk", ">",
- (f"{current_app.config.get('TMPDIR')}/"
- f"{token}/{_output_filename}")])),
- status="queued",
- output_file=_output_filename)
+ return jsonify(unique_id=queue_cmd(
+ conn=redis.Redis(),
+ email=(request.get_json() or {}).get('email'),
+ job_queue=current_app.config.get("REDIS_JOB_QUEUE"),
+ cmd=compose_gemma_cmd(
+ gemma_wrapper_cmd=current_app.config.get("GEMMA_"
+ "WRAPPER_CMD"),
+ gemma_wrapper_kwargs={
+ "loco": ("--input "
+ f"{os.path.join(working_dir, k_filename)}")
+ },
+ gemma_kwargs=gemma_kwargs,
+ gemma_args=[
+ "-gk", ">",
+ (f"{current_app.config.get('TMPDIR')}/"
+ f"{token}/{_output_filename}")
+ ])),
+ status="queued",
+ output_file=_output_filename)
# pylint: disable=W0703
except Exception:
- return jsonify(status=128,
- # use better message
- message="Metadata file non-existent!")
+ return jsonify(
+ status=128,
+ # use better message
+ message="Metadata file non-existent!")
@gemma.route("/gwa-compute/<k_filename>/loco/covariates/maf/<maf>/<token>",
@@ -319,43 +335,47 @@ def compute_gwa_with_loco_covar(k_filename, maf, token):
"""Compute GWA values. No Covariates provided. Only loco and maf vals given.
"""
- working_dir = os.path.join(current_app.config.get("TMPDIR"),
- token)
- _dict = jsonfile_to_dict(os.path.join(working_dir,
- "metadata.json"))
+ working_dir = os.path.join(current_app.config.get("TMPDIR"), token)
+ _dict = jsonfile_to_dict(os.path.join(working_dir, "metadata.json"))
try:
genofile, phenofile, snpsfile, covarfile = [
- os.path.join(working_dir,
- _dict.get(x))
- for x in ["geno", "pheno", "snps", "covar"]]
+ os.path.join(working_dir, _dict.get(x))
+ for x in ["geno", "pheno", "snps", "covar"]
+ ]
if not do_paths_exist([genofile, phenofile, snpsfile, covarfile]):
raise FileNotFoundError
- gemma_kwargs = {"g": genofile, "p": phenofile,
- "a": snpsfile, "c": covarfile,
- "lmm": _dict.get("lmm", 9),
- "maf": float(maf)}
+ gemma_kwargs = {
+ "g": genofile,
+ "p": phenofile,
+ "a": snpsfile,
+ "c": covarfile,
+ "lmm": _dict.get("lmm", 9),
+ "maf": float(maf)
+ }
_hash = get_hash_of_files([genofile, phenofile, snpsfile, covarfile])
_output_filename = f"{_hash}-gwa-output.json"
- return jsonify(
- unique_id=queue_cmd(
- conn=redis.Redis(),
- email=(request.get_json() or {}).get('email'),
- job_queue=current_app.config.get("REDIS_JOB_QUEUE"),
- cmd=compose_gemma_cmd(
- gemma_wrapper_cmd=current_app.config.get("GEMMA_"
- "WRAPPER_CMD"),
- gemma_wrapper_kwargs={
- "loco": ("--input "
- f"{os.path.join(working_dir, k_filename)}")
- },
- gemma_kwargs=gemma_kwargs,
- gemma_args=["-gk", ">",
- (f"{current_app.config.get('TMPDIR')}/"
- f"{token}/{_output_filename}")])),
- status="queued",
- output_file=_output_filename)
+ return jsonify(unique_id=queue_cmd(
+ conn=redis.Redis(),
+ email=(request.get_json() or {}).get('email'),
+ job_queue=current_app.config.get("REDIS_JOB_QUEUE"),
+ cmd=compose_gemma_cmd(
+ gemma_wrapper_cmd=current_app.config.get("GEMMA_"
+ "WRAPPER_CMD"),
+ gemma_wrapper_kwargs={
+ "loco": ("--input "
+ f"{os.path.join(working_dir, k_filename)}")
+ },
+ gemma_kwargs=gemma_kwargs,
+ gemma_args=[
+ "-gk", ">",
+ (f"{current_app.config.get('TMPDIR')}/"
+ f"{token}/{_output_filename}")
+ ])),
+ status="queued",
+ output_file=_output_filename)
# pylint: disable=W0703
except Exception:
- return jsonify(status=128,
- # use better message
- message="Metadata file non-existent!")
+ return jsonify(
+ status=128,
+ # use better message
+ message="Metadata file non-existent!")
diff --git a/gn3/computations/gemma.py b/gn3/computations/gemma.py
index 7ee70b0..7b5f91d 100644
--- a/gn3/computations/gemma.py
+++ b/gn3/computations/gemma.py
@@ -49,9 +49,7 @@ def do_paths_exist(paths: ValuesView) -> bool:
def generate_gemma_computation_cmd(
- gemma_cmd: str,
- gemma_kwargs: Dict[str, str],
- output_file: str,
+ gemma_cmd: str, gemma_kwargs: Dict[str, str], output_file: str,
gemma_wrapper_kwargs: Dict[str, str]) -> Optional[str]:
"""Create a computation cmd"""
geno_filename = gemma_kwargs.get("geno_filename", "")
@@ -69,5 +67,4 @@ def generate_gemma_computation_cmd(
return compose_gemma_cmd(gemma_wrapper_cmd=gemma_cmd,
gemma_wrapper_kwargs=gemma_wrapper_kwargs,
gemma_kwargs=_kwargs,
- gemma_args=["-gk", ">",
- output_file])
+ gemma_args=["-gk", ">", output_file])