about summary refs log tree commit diff
path: root/transform
diff options
context:
space:
mode:
authorMunyoki Kilyungi2023-11-24 14:42:32 +0300
committerMunyoki Kilyungi2023-11-24 14:42:32 +0300
commit54ba0cc5e8ed477a0d98f6a35cad74115814e257 (patch)
tree8691e8052b055492d93dc8996d71d1bf97e1cbb3 /transform
parentdbc5bbac28deb8ffe2ae2ec0e037885bba9e5be0 (diff)
downloadgn-transform-databases-54ba0cc5e8ed477a0d98f6a35cad74115814e257.tar.gz
Move remap-species-identifiers to strings.scm.
Signed-off-by: Munyoki Kilyungi <me@bonfacemunyoki.com>
Diffstat (limited to 'transform')
-rw-r--r--transform/strings.scm12
1 files changed, 12 insertions, 0 deletions
diff --git a/transform/strings.scm b/transform/strings.scm
index 7d9bc82..7545f62 100644
--- a/transform/strings.scm
+++ b/transform/strings.scm
@@ -11,6 +11,7 @@
             delete-substrings
             replace-substrings
             remove-duplicates
+            remap-species-identifiers
             sanitize-rdf-string
             snake->lower-camel
             lower-case-and-replace-spaces
@@ -119,3 +120,14 @@ association list mapping substrings to their replacements."
       ((null? lst) (reverse result))
       ((memq (car lst) result) (loop (cdr lst) result))
       (else (loop (cdr lst) (cons (car lst) result))))))
+
+
+(define (remap-species-identifiers str)
+  "Return the standard binomial name for the species label STR, or STR itself
+   when no remapping is known.  The real fix is to correct the database."
+  (let ((known '(("Fly (Drosophila melanogaster dm6)" . "Drosophila melanogaster")
+                 ("Oryzias latipes (Japanese medaka)" . "Oryzias latipes")
+                 ("Macaca mulatta" . "Macaca nemestrina")
+                 ("Bat (Glossophaga soricina)" . "Glossophaga soricina"))))
+    ;; assoc compares with equal?, so any unlisted value passes through.
+    (cond ((assoc str known) => cdr) (else str))))