"""Views handling ('classical') phenotypes.""" import sys import uuid import json import datetime from pathlib import Path from functools import wraps from logging import INFO, ERROR, DEBUG, FATAL, CRITICAL, WARNING from redis import Redis from requests.models import Response from MySQLdb.cursors import DictCursor from gn_libs.mysqldb import database_connection from flask import (flash, request, url_for, redirect, Blueprint, current_app as app) # from r_qtl import r_qtl2 as rqtl2 from r_qtl import r_qtl2_qc as rqc from r_qtl import exceptions as rqe from uploader import jobs from uploader.files import save_file#, fullpath from uploader.ui import make_template_renderer from uploader.oauth2.client import oauth2_post from uploader.authorisation import require_login from uploader.species.models import all_species, species_by_id from uploader.monadic_requests import make_either_error_handler from uploader.request_checks import with_species, with_population from uploader.datautils import safe_int, order_by_family, enumerate_sequence from uploader.population.models import (populations_by_species, population_by_species_and_id) from uploader.input_validation import (encode_errors, decode_errors, is_valid_representative_name) from .models import (dataset_by_id, phenotype_by_id, phenotypes_count, save_new_dataset, dataset_phenotypes, datasets_by_population) phenotypesbp = Blueprint("phenotypes", __name__) render_template = make_template_renderer("phenotypes") @phenotypesbp.route("/phenotypes", methods=["GET"]) @require_login def index(): """Direct entry-point for phenotypes data handling.""" with database_connection(app.config["SQL_URI"]) as conn: if not bool(request.args.get("species_id")): return render_template("phenotypes/index.html", species=order_by_family(all_species(conn)), activelink="phenotypes") species = species_by_id(conn, request.args.get("species_id")) if not bool(species): flash("No such species!", "alert-danger") return redirect(url_for("species.populations.phenotypes.index")) return redirect(url_for("species.populations.phenotypes.select_population", species_id=species["SpeciesId"])) @phenotypesbp.route("<int:species_id>/phenotypes/select-population", methods=["GET"]) @require_login @with_species(redirect_uri="species.populations.phenotypes.index") def select_population(species: dict, **kwargs):# pylint: disable=[unused-argument] """Select the population for your phenotypes.""" with database_connection(app.config["SQL_URI"]) as conn: if not bool(request.args.get("population_id")): return render_template("phenotypes/select-population.html", species=species, populations=order_by_family( populations_by_species( conn, species["SpeciesId"]), order_key="FamilyOrder"), activelink="phenotypes") population = population_by_species_and_id( conn, species["SpeciesId"], int(request.args["population_id"])) if not bool(population): flash("No such population found!", "alert-danger") return redirect(url_for( "species.populations.phenotypes.select_population", species_id=species["SpeciesId"])) return redirect(url_for("species.populations.phenotypes.list_datasets", species_id=species["SpeciesId"], population_id=population["Id"])) @phenotypesbp.route( "<int:species_id>/populations/<int:population_id>/phenotypes/datasets", methods=["GET"]) @require_login @with_population(species_redirect_uri="species.populations.phenotypes.index", redirect_uri="species.populations.phenotypes.select_population") def list_datasets(species: dict, population: dict, **kwargs):# pylint: disable=[unused-argument] """List available phenotype datasets.""" with database_connection(app.config["SQL_URI"]) as conn: datasets = datasets_by_population( conn, species["SpeciesId"], population["Id"]) if len(datasets) == 1: return redirect(url_for( "species.populations.phenotypes.view_dataset", species_id=species["SpeciesId"], population_id=population["Id"], dataset_id=datasets[0]["Id"])) return render_template("phenotypes/list-datasets.html", species=species, population=population, datasets=datasets, activelink="list-datasets") def with_dataset( species_redirect_uri: str, population_redirect_uri: str, redirect_uri: str ): """Ensure the dataset actually exists.""" def __decorator__(func): @wraps(func) @with_population(species_redirect_uri, population_redirect_uri) def __with_dataset__(**kwargs): try: _spcid = int(kwargs["species_id"]) _popid = int(kwargs["population_id"]) _dsetid = int(kwargs.get("dataset_id")) select_dataset_uri = redirect(url_for( redirect_uri, species_id=_spcid, population_id=_popid)) if not bool(_dsetid): flash("You need to select a valid 'dataset_id' value.", "alert-danger") return select_dataset_uri with database_connection(app.config["SQL_URI"]) as conn: dataset = dataset_by_id(conn, _spcid, _popid, _dsetid) if not bool(dataset): flash("You must select a valid dataset.", "alert-danger") return select_dataset_uri except ValueError as _verr: app.logger.debug( "Exception converting 'dataset_id' to integer: %s", kwargs.get("dataset_id"), exc_info=True) flash("Expected 'dataset_id' value to be an integer." "alert-danger") return select_dataset_uri return func(dataset=dataset, **kwargs) return __with_dataset__ return __decorator__ @phenotypesbp.route( "<int:species_id>/populations/<int:population_id>/phenotypes/datasets" "/<int:dataset_id>/view", methods=["GET"]) @require_login @with_dataset( species_redirect_uri="species.populations.phenotypes.index", population_redirect_uri="species.populations.phenotypes.select_population", redirect_uri="species.populations.phenotypes.list_datasets") def view_dataset(# pylint: disable=[unused-argument] species: dict, population: dict, dataset: dict, **kwargs): """View a specific dataset""" with database_connection(app.config["SQL_URI"]) as conn: dataset = dataset_by_id( conn, species["SpeciesId"], population["Id"], dataset["Id"]) if not bool(dataset): flash("Could not find such a phenotype dataset!", "alert-danger") return redirect(url_for( "species.populations.phenotypes.list_datasets", species_id=species["SpeciesId"], population_id=population["Id"])) start_at = max(safe_int(request.args.get("start_at") or 0), 0) count = int(request.args.get("count") or 20) return render_template("phenotypes/view-dataset.html", species=species, population=population, dataset=dataset, phenotype_count=phenotypes_count( conn, population["Id"], dataset["Id"]), phenotypes=enumerate_sequence( dataset_phenotypes(conn, population["Id"], dataset["Id"], offset=start_at, limit=count), start=start_at+1), start_from=start_at, count=count, activelink="view-dataset") @phenotypesbp.route( "<int:species_id>/populations/<int:population_id>/phenotypes/datasets" "/<int:dataset_id>/phenotype/<xref_id>", methods=["GET"]) @require_login @with_dataset( species_redirect_uri="species.populations.phenotypes.index", population_redirect_uri="species.populations.phenotypes.select_population", redirect_uri="species.populations.phenotypes.list_datasets") def view_phenotype(# pylint: disable=[unused-argument] species: dict, population: dict, dataset: dict, xref_id: int, **kwargs ): """View an individual phenotype from the dataset.""" def __render__(privileges): return render_template( "phenotypes/view-phenotype.html", species=species, population=population, dataset=dataset, phenotype=phenotype_by_id(conn, species["SpeciesId"], population["Id"], dataset["Id"], xref_id), privileges=(privileges ### For demo! Do not commit this part + ("group:resource:edit-resource", "group:resource:delete-resource",) ### END: For demo! Do not commit this part ), activelink="view-phenotype") def __fail__(error): if isinstance(error, Response) and error.json() == "No linked resource!": return __render__(tuple()) return make_either_error_handler( "There was an error fetching the roles and privileges.")(error) with database_connection(app.config["SQL_URI"]) as conn: return oauth2_post( "/auth/resource/phenotypes/individual/linked-resource", json={ "species_id": species["SpeciesId"], "population_id": population["Id"], "dataset_id": dataset["Id"], "xref_id": xref_id } ).then( lambda resource: tuple( privilege["privilege_id"] for role in resource["roles"] for privilege in role["privileges"]) ).then(__render__).either(__fail__, lambda resp: resp) @phenotypesbp.route( "<int:species_id>/populations/<int:population_id>/phenotypes/datasets/create", methods=["GET", "POST"]) @require_login @with_population( species_redirect_uri="species.populations.phenotypes.index", redirect_uri="species.populations.phenotypes.select_population") def create_dataset(species: dict, population: dict, **kwargs):# pylint: disable=[unused-argument] """Create a new phenotype dataset.""" with (database_connection(app.config["SQL_URI"]) as conn, conn.cursor(cursorclass=DictCursor) as cursor): if request.method == "GET": return render_template("phenotypes/create-dataset.html", activelink="create-dataset", species=species, population=population, **decode_errors( request.args.get("error_values", ""))) form = request.form _errors: tuple[tuple[str, str], ...] = tuple() if not is_valid_representative_name( (form.get("dataset-name") or "").strip()): _errors = _errors + (("dataset-name", "Invalid dataset name."),) if not bool((form.get("dataset-fullname") or "").strip()): _errors = _errors + (("dataset-fullname", "You must provide a value for 'Full Name'."),) if bool(_errors) > 0: return redirect(url_for( "species.populations.phenotypes.create_dataset", species_id=species["SpeciesId"], population_id=population["Id"], error_values=encode_errors(_errors, form))) dataset_shortname = ( form["dataset-shortname"] or form["dataset-name"]).strip() _pheno_dataset = save_new_dataset( cursor, population["Id"], form["dataset-name"].strip(), form["dataset-fullname"].strip(), dataset_shortname) return redirect(url_for("species.populations.phenotypes.list_datasets", species_id=species["SpeciesId"], population_id=population["Id"])) def process_phenotypes_rqtl2_bundle( rconn: Redis, species: dict, population: dict, dataset: dict): """Process phenotypes from the uploaded R/qtl2 bundle.""" _redisuri = app.config["REDIS_URL"] _sqluri = app.config["SQL_URI"] try: ## Handle huge files here... phenobundle = save_file(request.files["phenotypes-bundle"], Path(app.config["UPLOAD_FOLDER"])) rqc.validate_bundle(phenobundle) except AssertionError as _aerr: app.logger.debug("File upload error!", exc_info=True) flash("Expected a zipped bundle of files with phenotypes' " "information.", "alert-danger") return add_phenos_uri except rqe.RQTLError as rqtlerr: app.logger.debug("Bundle validation error!", exc_info=True) flash("R/qtl2 Error: " + " ".join(rqtlerr.args), "alert-danger") return add_phenos_uri _jobid = uuid.uuid4() _namespace = jobs.jobsnamespace() _ttl_seconds = app.config["JOBS_TTL_SECONDS"] _job = jobs.launch_job( jobs.initialise_job( rconn, _namespace, str(_jobid), [sys.executable, "-m", "scripts.rqtl2.phenotypes_qc", _sqluri, _redisuri, _namespace, str(_jobid), str(species["SpeciesId"]), str(population["Id"]), # str(dataset["Id"]), str(phenobundle), "--loglevel", { INFO: "INFO", ERROR: "ERROR", DEBUG: "DEBUG", FATAL: "FATAL", CRITICAL: "CRITICAL", WARNING: "WARNING" }[app.logger.getEffectiveLevel()], "--redisexpiry", str(_ttl_seconds)], "phenotype_qc", _ttl_seconds, {"job-metadata": json.dumps({ "speciesid": species["SpeciesId"], "populationid": population["Id"], "datasetid": dataset["Id"], "bundle": str(phenobundle.absolute())})}), _redisuri, f"{app.config['UPLOAD_FOLDER']}/job_errors") app.logger.debug("JOB DETAILS: %s", _job) return redirect(url_for("species.populations.phenotypes.job_status", species_id=species["SpeciesId"], population_id=population["Id"], dataset_id=dataset["Id"], job_id=str(_job["jobid"]))) def process_phenotypes_individual_files(rconn, species, population, dataset): """Process the uploaded individual files.""" ## Handle huge file uploads here... ## Convert files and settings to R/qtl2 bundle ## Use same processing as R/qtl2 bundle (after some refactoring) raise NotImplementedError("Implement this!") @phenotypesbp.route( "<int:species_id>/populations/<int:population_id>/phenotypes/datasets" "/<int:dataset_id>/add-phenotypes", methods=["GET", "POST"]) @require_login @with_dataset( species_redirect_uri="species.populations.phenotypes.index", population_redirect_uri="species.populations.phenotypes.select_population", redirect_uri="species.populations.phenotypes.list_datasets") def add_phenotypes(species: dict, population: dict, dataset: dict, **kwargs):# pylint: disable=[unused-argument, too-many-locals] """Add one or more phenotypes to the dataset.""" use_bundle = request.args.get("use_bundle", "").lower() == "true" add_phenos_uri = redirect(url_for( "species.populations.phenotypes.add_phenotypes", species_id=species["SpeciesId"], population_id=population["Id"], dataset_id=dataset["Id"])) _redisuri = app.config["REDIS_URL"] _sqluri = app.config["SQL_URI"] with (Redis.from_url(_redisuri, decode_responses=True) as rconn, # database_connection(_sqluri) as conn, # conn.cursor(cursorclass=DictCursor) as cursor ): if request.method == "GET": today = datetime.date.today() return render_template( ("phenotypes/add-phenotypes-with-rqtl2-bundle.html" if use_bundle else "phenotypes/add-phenotypes-raw-files.html"), species=species, population=population, dataset=dataset, monthnames=( "January", "February", "March", "April", "May", "June", "July", "August", "September", "October", "November", "December"), current_month=today.strftime("%B"), current_year=int(today.strftime("%Y")), families_with_se_and_n=( "Reference Populations (replicate average, SE, N)",), use_bundle=use_bundle, activelink="add-phenotypes") if use_bundle: return process_phenotypes_rqtl2_bundle( rconn, species, population, dataset) return process_phenotypes_individual_files( rconn, species, population, dataset) @phenotypesbp.route( "<int:species_id>/populations/<int:population_id>/phenotypes/datasets" "/<int:dataset_id>/job/<uuid:job_id>", methods=["GET"]) @require_login @with_dataset( species_redirect_uri="species.populations.phenotypes.index", population_redirect_uri="species.populations.phenotypes.select_population", redirect_uri="species.populations.phenotypes.list_datasets") def job_status( species: dict, population: dict, dataset: dict, job_id: uuid.UUID, **kwargs ):# pylint: disable=[unused-argument] """Retrieve current status of a particular phenotype QC job.""" with Redis.from_url(app.config["REDIS_URL"], decode_responses=True) as rconn: try: job = jobs.job(rconn, jobs.jobsnamespace(), str(job_id)) except jobs.JobNotFound as _jnf: job = None return render_template("phenotypes/job-status.html", species=species, population=population, dataset=dataset, job_id=job_id, job=job, errors=jobs.job_errors( rconn, jobs.jobsnamespace(), job['jobid']), metadata=jobs.job_files_metadata( rconn, jobs.jobsnamespace(), job['jobid']), activelink="add-phenotypes")