about summary refs log tree commit diff
path: root/gn3/db
diff options
context:
space:
mode:
authorBonfaceKilz2022-03-10 13:27:06 +0300
committerBonfaceKilz2022-03-12 15:33:09 +0300
commit7641343e90f9a7f03cf0baf30818675efac6d7f3 (patch)
tree723b04515a5ea206a385b699a54d685ba3cd26a3 /gn3/db
parent9b714166cf0ebbbb098a52b97d7c9b4e3ec13a2e (diff)
downloadgenenetwork3-7641343e90f9a7f03cf0baf30818675efac6d7f3.tar.gz
Create action dict that's created when updating data
* gn3/db/sample_data.py (__extract_actions): An update on a vector of data can
contain inserts, deletes and updates. This function extracts these actions
during an update.
* tests/unit/db/test_sample_data.py (test_extract_actions): Add test-case for
the above.
Diffstat (limited to 'gn3/db')
-rw-r--r--gn3/db/sample_data.py32
1 files changed, 32 insertions, 0 deletions
diff --git a/gn3/db/sample_data.py b/gn3/db/sample_data.py
index ccb03f2..06c3cc5 100644
--- a/gn3/db/sample_data.py
+++ b/gn3/db/sample_data.py
@@ -11,6 +11,38 @@ _MAP = {
 }
 
 
def __extract_actions(original_data: str,
                      updated_data: str,
                      csv_header: str) -> dict:
    """Return the delete, insert and update actions implied by an edit.

    The three arguments are comma-separated strings that are compared
    position by position: ORIGINAL_DATA is the row before the edit,
    UPDATED_DATA is the row after it and CSV_HEADER holds the column names.
    The literal value "x" marks a missing value, so:

    - a value replaced by "x" is a deletion (the original value is kept);
    - an "x" replaced by a value is an insertion (the new value is kept);
    - any other change between two non-empty values is an update (the new
      value is kept).

    Columns that did not change are skipped, and so is any change where one
    side is an empty string.  Columns beyond the shortest of the three inputs
    are ignored.

    The result maps "delete", "insert" and "update" to either None, when
    there is nothing to do for that action, or to a dict whose "data" and
    "csv_header" entries are comma-separated strings of the affected values
    and their column names.

    """
    collected = {
        action: {"data": [], "csv_header": []}
        for action in ("delete", "insert", "update")
    }
    # The parameters are left untouched so they keep their annotated type.
    columns = zip(original_data.strip().split(","),
                  updated_data.strip().split(","),
                  csv_header.strip().split(","))
    for old, new, header in columns:
        # Nothing to record when the value is unchanged or one side is empty.
        if old == new or not (old and new):
            continue
        if new == "x":
            action, value = "delete", old
        elif old == "x":
            action, value = "insert", new
        else:
            action, value = "update", new
        collected[action]["data"].append(value)
        collected[action]["csv_header"].append(header)
    # Build a fresh dict rather than rewriting the one being iterated.
    return {
        action: {
            "data": ",".join(found["data"]),
            "csv_header": ",".join(found["csv_header"]),
        } if found["data"] else None
        for action, found in collected.items()
    }
+
+
 def get_trait_csv_sample_data(conn: Any,
                               trait_name: int, phenotype_id: int) -> str:
     """Fetch a trait and return it as a csv string"""