From 602514e0ab5118590ae052fbd801f7fb596436a8 Mon Sep 17 00:00:00 2001 From: Munyoki Kilyungi Date: Mon, 12 Feb 2024 23:04:14 +0300 Subject: Retrieve metadata from text files given a path. * gn3/db/datasets.py (retrieve_trait_dataset): New file. Signed-off-by: Munyoki Kilyungi --- gn3/db/datasets.py | 21 +++++++++++++++++++++ 1 file changed, 21 insertions(+) (limited to 'gn3/db') diff --git a/gn3/db/datasets.py b/gn3/db/datasets.py index 6e3977f..5501d92 100644 --- a/gn3/db/datasets.py +++ b/gn3/db/datasets.py @@ -3,6 +3,7 @@ This module contains functions relating to specific trait dataset manipulation """ import os from typing import Any +from pathlib import Path from flask import current_app as app @@ -330,3 +331,23 @@ def retrieve_trait_dataset(trait_type, trait, threshold, conn): **dataset_fns[trait_type](), **group } + + +def retrieve_dataset_metadata(name: str) -> dict: + """Return the full data given a path, NAME""" + result = {} + __subject = { + "summary": "dct:description", + "tissue": "gnt:hasTissueInfo", + "specifics": "gnt:hasTissueInfo", + "cases": "gnt:hasCaseInfo", + "platform": "gnt:hasPlatformInfo", + "processing": "gnt:hasDataProcessingInfo", + "notes": "gnt:hasNotes", + "experiment-design": "gnt:hasExperimentDesignInfo", + "acknowledgment": "gnt:hasAcknowledgement", + } + for __file in Path(name).glob("*rtf"): + with __file.open() as _f: + result[__subject.get(__file.stem, f"gn:{__file.stem}")] = _f.read() + return result -- cgit v1.2.3