about summary refs log tree commit diff
path: root/genenetwork/services/genenetwork.scm
diff options
context:
space:
mode:
Diffstat (limited to 'genenetwork/services/genenetwork.scm')
-rw-r--r--genenetwork/services/genenetwork.scm239
1 files changed, 182 insertions, 57 deletions
diff --git a/genenetwork/services/genenetwork.scm b/genenetwork/services/genenetwork.scm
index b863bcf..9ba6213 100644
--- a/genenetwork/services/genenetwork.scm
+++ b/genenetwork/services/genenetwork.scm
@@ -57,6 +57,7 @@
             genenetwork-configuration-port           ; external port
             genenetwork-configuration-gn2-port       ; internal port
             genenetwork-configuration-gn3-port       ; internal port
+            genenetwork-configuration-gn-guile-port  ; aka gn4 internal port (may be external)
             genenetwork-configuration-auth-db        ; RW auth DB
             genenetwork-configuration-xapian-db      ; RO search index, unless you want to regenerate inside VM
             genenetwork-configuration-genotype-files ; RO genotype files
@@ -109,16 +110,24 @@
                            (default "/var/empty"))
   (gn3-data-directory genenetwork-configuration-gn3-data-directory
                       (default "/var/genenetwork"))
+  (gn2-sessions-dir genenetwork-configuration-gn2-sessions-dir
+                    (default "/var/genenetwork/sessions/genenetwork2"))
   (gn2-secrets genenetwork-configuration-gn2-secrets
                (default "/etc/genenetwork"))
   (gn3-secrets genenetwork-configuration-gn3-secrets
                (default "/etc/genenetwork/gn3-secrets.py"))
   (gn-auth-secrets genenetwork-configuration-gn-auth-secrets
                    (default "/etc/genenetwork"))
+  (gn-guile genenetwork-configuration-gn-guile
+            (default gn-guile))
   (gn-guile-port genenetwork-configuration-gn-guile-port
                  (default 8091))
   (gn-doc-git-checkout genenetwork-configuration-gn-doc-git-checkout
                        (default "/export/data/gn-docs"))
+  (gn-virtuoso-ttl-directory genenetwork-configuration-gn-virtuoso-ttl-directory
+                             (default "/export/data/virtuoso/ttl"))
+  (gn-tmpdir genenetwork-configuration-gn-tmpdir
+             (default "/opt/gn/tmp"))
   (log-level genenetwork-configuration-log-level
              (default 'warning)
              (sanitize sanitize-log-level)))
@@ -142,6 +151,10 @@
                    (default "https://auth.genenetwork.org"))
   (gn2-server-url gn-uploader-configuration-gn2-server-url
                   (default "https://genenetwork.org"))
+  (sessions-dir gn-uploader-sessions-dir
+                (default "/var/genenetwork/sessions/gn-uploader"))
+  (sqlite-databases-directory gn-uploader-sqlite-databases-directory
+                              (default "/var/genenetwork/sqlite/gn-uploader"))
   (log-level gn-uploader-configuration-log-level
              (default 'warning)
              (sanitize sanitize-log-level)))
@@ -170,6 +183,8 @@
          (genenetwork3 (genenetwork-configuration-genenetwork3 config))
          (xapian-directory (genenetwork-configuration-xapian-db config))
          (sparql-endpoint (genenetwork-configuration-sparql-endpoint config))
+         (virtuoso-ttl-directory
+          (genenetwork-configuration-gn-virtuoso-ttl-directory config))
          (xapian-build-directory (string-append xapian-directory "/build"))
          (herd (file-append shepherd "/bin/herd"))
          (index-genenetwork (file-append genenetwork3 "/bin/index-genenetwork"))
@@ -203,7 +218,9 @@
                                                   "is-data-modified"
                                                   #$xapian-directory
                                                   #$sql-uri
-                                                  #$sparql-endpoint))))
+                                                  #$sparql-endpoint
+                                                  "--virtuoso-ttl-directory"
+                                                  #$virtuoso-ttl-directory))))
             (dynamic-wind
               (const #t)
               ;; build the index
@@ -212,7 +229,9 @@
                         "create-xapian-index"
                         #$xapian-build-directory
                         #$sql-uri
-                        #$sparql-endpoint)
+                        #$sparql-endpoint
+                        "--virtuoso-ttl-directory"
+                        #$virtuoso-ttl-directory)
                 (dynamic-wind
                   ;; stop GN3: Here there is magic!!!
                   ;;     The name `gunicorn-genenetwork' is magical. It is not set
@@ -240,9 +259,35 @@
                             (chmod file #o644))
                           (find-files #$xapian-directory)))))))))
 
+(define (samples-count-script-gexp config)
+  (match-record config <genenetwork-configuration>
+                (genenetwork2 sql-uri)
+    (with-imported-modules '((guix build utils))
+      #~(begin
+          (use-modules (guix build utils))
+
+          (setenv "PYTHONPATH"
+                  (string-append
+                   #$(file-append genenetwork2
+                                  "/lib/python"
+                                  (python-version (package-version python))
+                                  "/site-packages")
+                   ":"
+                   #$(profile
+                       (content (package->development-manifest genenetwork2))
+                       (allow-collisions? #t))
+                   "/lib/python"
+                   #$(python-version (package-version python))
+                   "/site-packages"))
+
+          (invoke #$(file-append python "/bin/python3")
+                  "-m"
+                  "gn2.scripts.sample_count"
+                  #$sql-uri)))))
+
 (define (genenetwork-activation config)
   (match-record config <genenetwork-configuration>
-    (gn2-secrets gn3-secrets gn-auth-secrets auth-db llm-db-path)
+    (gn2-secrets gn3-secrets gn-auth-secrets auth-db llm-db-path genotype-files gn-tmpdir gn-doc-git-checkout gn2-sessions-dir)
     (with-imported-modules '((guix build utils))
       #~(begin
           (use-modules (guix build utils))
@@ -262,7 +307,11 @@
                              (passwd:uid (getpw "gunicorn-genenetwork2"))
                              (passwd:gid (getpw "gunicorn-genenetwork2"))))
                     (append (list #$gn2-secrets)
+                            (find-files #$genotype-files
+                                        #:directories? #t)
                             (find-files #$gn2-secrets
+                                        #:directories? #t)
+                            (find-files #$gn2-sessions-dir
                                         #:directories? #t)))
           (for-each (lambda (file)
                       (chown file
@@ -278,7 +327,31 @@
                             (find-files #$gn2-secrets
                                         #:directories? #f)
                             (find-files #$gn-auth-secrets
-                                        #:directories? #f)))))))
+                                        #:directories? #f)))
+          ;; Make sub-directories for various apps under gn-tmpdir and assign
+          ;; appropriate permissions
+          (for-each (match-lambda
+                      ((subdir user)
+                       (let ((full-path
+                              (string-append #$gn-tmpdir "/" subdir)))
+                         (unless (file-exists? full-path)
+                           (mkdir full-path #o755))
+                         (for-each (lambda (file)
+                                     (chown file
+                                            (passwd:uid (getpw user))
+                                            (passwd:gid (getpw user))))
+                                   (find-files full-path
+                                               #:directories? #t)))))
+                    '(("gn2-tmpdir" "gunicorn-genenetwork2")
+                      ("gn3-tmpdir" "gunicorn-genenetwork3")))
+
+          ;; setup correct ownership for gn-docs
+          (for-each (lambda (file)
+                      (chown file
+                             (passwd:uid (getpw "genenetwork"))
+                             (passwd:gid (getpw "genenetwork"))))
+                    (find-files #$(dirname gn-doc-git-checkout)
+                                #:directories? #t))))))
 
 (define (configuration-file-gexp alist)
   "Return a G-expression that constructs a configuration file of
@@ -309,7 +382,7 @@ G-expressions or numbers."
 described by @var{config}, a @code{<genenetwork-configuration>}
 object."
   (match-record config <genenetwork-configuration>
-    (genenetwork2 genenetwork3 gn-auth server-name gn-auth-server-name gn2-port gn3-port gn-auth-port sql-uri auth-db xapian-db genotype-files sparql-endpoint gn-sourcecode-directory gn3-data-directory gn2-secrets gn3-secrets gn-auth-secrets llm-db-path log-level)
+    (genenetwork2 genenetwork3 gn-auth server-name gn-auth-server-name gn2-port gn3-port gn-auth-port sql-uri auth-db xapian-db genotype-files gn2-sessions-dir sparql-endpoint gn-sourcecode-directory gn3-data-directory gn2-secrets gn3-secrets gn-auth-secrets llm-db-path gn-tmpdir log-level gn-guile-port)
     ;; If we mapped only the mysqld.sock socket file, it would break
     ;; when the external mysqld server is restarted.
     (let* ((database-mapping (file-system-mapping
@@ -328,12 +401,16 @@ object."
                                        ("GENENETWORK_FILES" ,genotype-files)
                                        ("GN3_LOCAL_URL" ,(string-append "http://localhost:"
                                                                         (number->string gn3-port)))
+                                       ("GN_GUILE_SERVER_URL" ,(string-append "http://localhost:" ; AKA GN4
+                                                                        (number->string gn-guile-port) "/" ))
                                        ("GN_SERVER_URL" ,(string-append "https://" server-name "/api3/"))
                                        ("AUTH_SERVER_URL" ,(string-append "https://" gn-auth-server-name "/"))
                                        ("JS_GUIX_PATH" ,(file-append gn2-profile "/share/genenetwork2/javascript"))
                                        ("PLINK_COMMAND" ,(file-append gn2-profile "/bin/plink2"))
                                        ("SQL_URI" ,sql-uri)
-                                       ("AI_SEARCH_ENABLED" "True")))))
+                                       ("AI_SEARCH_ENABLED" "True")
+                                       ("SESSION_FILESYSTEM_CACHE_PATH" ,gn2-sessions-dir)
+                                       ("MAX_FORM_MEMORY_SIZE" 52428800)))))
            (gn3-profile (profile
                          (content (package->development-manifest genenetwork3))
                          (allow-collisions? #t)))
@@ -342,6 +419,8 @@ object."
                                     (configuration-file-gexp
                                      `(("AUTH_DB" ,auth-db)
                                        ("AUTH_SERVER_URL" ,(string-append "https://" gn-auth-server-name "/"))
+                                       ("GN_GUILE_SERVER_URL" ,(string-append "http://localhost:" ; AKA GN4
+                                                                        (number->string gn-guile-port) "/"))
                                        ("DATA_DIR" ,gn3-data-directory)
                                        ("SOURCE_DIR" ,gn-sourcecode-directory)
                                        ("SPARQL_ENDPOINT" ,sparql-endpoint)
@@ -358,9 +437,9 @@ object."
                                         (configuration-file-gexp
                                          `(("GN_AUTH_SECRETS" ,(string-append gn-auth-secrets "/gn-auth-secrets.py"))
                                            ("AUTH_DB" ,auth-db)
-                                           ("SQL_URI" ,sql-uri)
-                                           ("CLIENTS_SSL_PUBLIC_KEYS_DIR" ,(string-append gn-auth-secrets "/clients-public-keys"))
-                                           ("SSL_PRIVATE_KEY" ,(string-append gn-auth-secrets "/gn-auth-ssl-private-key.pem")))))))
+                                           ("SQL_URI" ,sql-uri)))))
+           (gn2-tmpdir (string-append gn-tmpdir "/gn2-tmpdir"))
+           (gn3-tmpdir (string-append gn-tmpdir "/gn3-tmpdir")))
       (list (gunicorn-app
              (name "genenetwork2")
              (package genenetwork2)
@@ -375,7 +454,7 @@ object."
                      (value gn2-profile))
                     (environment-variable
                      (name "TMPDIR")
-                     (value "/tmp"))
+                     (value gn2-tmpdir))
                     (environment-variable
                      (name "GN2_SETTINGS")
                      (value gn2-conf))
@@ -388,13 +467,17 @@ object."
              (mappings (list database-mapping
                              (file-system-mapping
                               (source genotype-files)
-                              (target source))
+                              (target source)
+                              (writable? #t))
                              (file-system-mapping
                               (source gn-sourcecode-directory)
                               (target source))
-                             (file-system-mapping ; GN2 and GN3 need to share TMPDIR
-                              (source "/tmp")
-                              (target "/tmp")
+                             (file-system-mapping ; GN2 and GN3 need to communicate via TMPDIR
+                              (source gn-tmpdir)
+                              (target source))
+                             (file-system-mapping
+                              (source gn2-tmpdir)
+                              (target source)
                               (writable? #t))
                              (file-system-mapping
                               (source gn2-conf)
@@ -408,7 +491,11 @@ object."
                               (writable? #t))
                              (file-system-mapping
                               (source gn2-ca-bundle)
-                              (target source))))
+                              (target source))
+                             (file-system-mapping
+                              (source gn2-sessions-dir)
+                              (target source)
+                              (writable? #t))))
              (extra-cli-arguments
               (list "--log-level"
                     (string-upcase (symbol->string log-level)))))
@@ -429,7 +516,7 @@ object."
                      (value gn3-conf))
                     (environment-variable
                      (name "TMPDIR")
-                     (value "/tmp"))
+                     (value gn3-tmpdir))
                     (environment-variable
                      (name "GN3_SECRETS")
                      (value gn3-secrets))
@@ -455,15 +542,18 @@ object."
                              (file-system-mapping
                               (source gn3-data-directory)
                               (target source))    ; Rqtl usese this
-                             (file-system-mapping ; GN2 and GN3 need to share TMPDIR
-                              (source "/tmp")
-                              (target "/tmp")
+                             (file-system-mapping ; GN2 and GN3 need to communicate via TMPDIR
+                              (source gn-tmpdir)
+                              (target source))
+                             (file-system-mapping
+                              (source gn3-tmpdir)
+                              (target source)
                               (writable? #t))
                              (file-system-mapping
                               (source xapian-db)
                               (target source))
                              (file-system-mapping
-                              (source llm-db-path)
+                              (source (dirname llm-db-path))
                               (target source)
                               (writable? #t))
                              (file-system-mapping
@@ -479,6 +569,7 @@ object."
                              (port gn-auth-port))))
              (wsgi-app-module "gn_auth:create_app()")
              (workers 20)
+             (timeout 1200)
              (environment-variables
               (list (environment-variable
                      (name "GN_AUTH_CONF")
@@ -497,9 +588,9 @@ object."
                               (source gn-auth-conf)
                               (target source))
                              (file-system-mapping
-                              (source auth-db)
-                              (target source)
-                              (writable? #t))
+                               (source (dirname auth-db))
+                               (target source)
+                               (writable? #t))
                              (file-system-mapping
                               (source gn-auth-secrets)
                               (target source)
@@ -526,7 +617,8 @@ a @code{<genenetwork-configuration>} record."
                                               (number->string gn2-port) ";")
                                "proxy_set_header Host $host;"
                                "proxy_read_timeout 20m;"
-                               "proxy_set_header X-Forwarded-Proto $scheme;")))
+                               "proxy_set_header X-Forwarded-Proto $scheme;"
+                               "client_max_body_size 8050m;")))
                   (nginx-location-configuration
                    (uri "/api3/")
                    (body (list "rewrite /api3/(.*) /api/$1 break;"
@@ -555,24 +647,38 @@ a @code{<genenetwork-configuration>} record."
   (list #~(job '(next-hour)
                #$(program-file "build-xapian-index-cron-gexp"
                                (build-xapian-index-cron-gexp config))
-               #:user "root")))
+               #:user "root")
+        #~(job '(next-minute-from (next-hour) '(17)) ;17th minute of every hour
+               #$(program-file "samples-count-script-gexp"
+                               (samples-count-script-gexp config)))))
 
-(define (gn-guile-gexp gn-guile-port)
+(define (gn-guile-gexp gn-guile-port gn-guile-pkg bare-repo)
   (with-imported-modules '((guix build utils))
     #~(begin
         (use-modules (guix build utils))
-        (let ((current-repo-path (string-append (getcwd) "/gn-docs")))
+        (let* ((gn-guile-profile #$(profile (content (package->development-manifest gn-guile-pkg))
+                                            (allow-collisions? #t)))
+               (ssl-cert-dir (string-append gn-guile-profile "/etc/ssl/certs"))
+               (ssl-cert-file (string-append ssl-cert-dir "/ca-certificates.crt"))
+               (current-repo-path (string-append (pk "CWD" (getcwd)) "/gn-docs")))
+          ;; These have to be set up manually here and not in the
+          ;; `gn-guile-shepherd-service' function; otherwise, they do not take
+          ;; effect for some reason.
+          (setenv "SSL_CERT_DIR" ssl-cert-dir)
+          (setenv "SSL_CERT_FILE" ssl-cert-file)
+          (setenv "GUILE_TLS_CERTIFICATE_DIRECTORY" ssl-cert-dir)
+
           (when (file-exists? current-repo-path)
             (delete-file-recursively current-repo-path))
           (setenv "CURRENT_REPO_PATH" current-repo-path)
           (invoke #$(file-append git-minimal "/bin/git")
-                  "clone" "--depth" "1" (getenv "CGIT_REPO_PATH")))
+                  "clone" "--depth" "1" #$(string-append "file://" bare-repo)))
         (invoke #$(file-append gn-guile "/bin/gn-guile")
                 (number->string #$gn-guile-port)))))
 
 (define (gn-guile-shepherd-service config)
   (match-record config <genenetwork-configuration>
-    (gn-doc-git-checkout gn-guile-port)
+    (gn-guile gn-doc-git-checkout gn-guile-port)
     (shepherd-service
      (documentation "Run gn-guile server.")
      (provision '(gn-guile))
@@ -588,14 +694,15 @@ a @code{<genenetwork-configuration>} record."
         #~(make-forkexec-constructor
 	   (list #$(least-authority-wrapper
                     (program-file "gn-guile"
-                                  (gn-guile-gexp gn-guile-port))
+                                  (gn-guile-gexp gn-guile-port gn-guile gn-doc-git-checkout))
                     #:name "gn-guile-pola-wrapper"
+                    #:directory (dirname gn-doc-git-checkout)
                     #:preserved-environment-variables
                     (map first gn-guile-settings)
                     #:mappings (list (file-system-mapping
-                                      (source gn-doc-git-checkout)
-                                      (target source)
-                                      (writable? #t)))
+                                       (source (dirname gn-doc-git-checkout))
+                                       (target source)
+                                       (writable? #t)))
                     #:namespaces (delq 'net %namespaces))
                  "127.0.0.1" #$(number->string gn-guile-port))
            #:user "genenetwork"
@@ -628,14 +735,20 @@ a @code{<genenetwork-configuration>} record."
 
 (define (gn-uploader-activation config)
   (match-record config <gn-uploader-configuration>
-    (secrets data-directory)
+    (secrets data-directory sessions-dir sqlite-databases-directory)
     (with-imported-modules '((guix build utils))
       #~(begin
           (use-modules (guix build utils))
           ;; Let service user own their own secrets files.
-          (chown #$secrets
-                 (passwd:uid (getpw "gunicorn-gn-uploader"))
-                 (passwd:gid (getpw "gunicorn-gn-uploader")))
+          (for-each (lambda (file)
+                      (chown file
+                             (passwd:uid (getpw "gunicorn-gn-uploader"))
+                             (passwd:gid (getpw "gunicorn-gn-uploader"))))
+                    (append (list #$(dirname secrets))
+                            (find-files #$sessions-dir
+                                        #:directories? #t)
+                            (find-files #$sqlite-databases-directory
+                                        #:directories? #t)))
           ;; Set owner-only permissions on secrets files.
           (for-each (lambda (file)
                       (chmod file #o600))
@@ -651,25 +764,27 @@ a @code{<genenetwork-configuration>} record."
 
 (define (gn-uploader-gunicorn-app config)
   (match-record config <gn-uploader-configuration>
-    (gn-uploader sql-uri port data-directory secrets log-level auth-server-url gn2-server-url)
+    (gn-uploader sql-uri port data-directory secrets log-level auth-server-url gn2-server-url sessions-dir sqlite-databases-directory)
     ;; If we mapped only the mysqld.sock socket file, it would break
     ;; when the external mysqld server is restarted.
-    (let ((database-mapping (file-system-mapping
-                             (source "/run/mysqld")
-                             (target source)
-                             (writable? #t)))
-          (gn-uploader-conf (computed-file "gn-uploader.conf"
-                                           (configuration-file-gexp
-                                            `(("UPLOADER_SECRETS" ,secrets)
-                                              ("SQL_URI" ,sql-uri)
-                                              ("UPLOAD_FOLDER" ,(string-append data-directory
-                                                                               "/uploads"))
-                                              ("AUTH_SERVER_URL" ,auth-server-url)
-                                              ("GN2_SERVER_URL" ,gn2-server-url)))))
-          (gn-uploader-profile (profile
-                                (content (package->development-manifest gn-uploader))
-                                (allow-collisions? #t)))
-          (gn-uploader-ca-bundle (file-append gn-uploader-profile "/etc/ssl/certs/ca-certificates.crt")))
+    (let* ((database-mapping (file-system-mapping
+                              (source "/run/mysqld")
+                              (target source)
+                              (writable? #t)))
+           (gn-uploader-conf (computed-file "gn-uploader.conf"
+                                            (configuration-file-gexp
+                                             `(("UPLOADER_SECRETS" ,secrets)
+                                               ("SQL_URI" ,sql-uri)
+                                               ("UPLOAD_FOLDER" ,(string-append data-directory
+                                                                                "/uploads"))
+                                               ("AUTH_SERVER_URL" ,auth-server-url)
+                                               ("GN2_SERVER_URL" ,gn2-server-url)
+                                               ("SESSION_FILESYSTEM_CACHE_PATH" ,sessions-dir)
+                                               ("ASYNCHRONOUS_JOBS_SQLITE_DB" ,(string-append sqlite-databases-directory "/background-jobs.db"))))))
+           (gn-uploader-profile (profile
+                                 (content (package->development-manifest gn-uploader))
+                                 (allow-collisions? #t)))
+           (gn-uploader-ca-bundle (file-append gn-uploader-profile "/etc/ssl/certs/ca-certificates.crt")))
       (list (gunicorn-app
              (name "gn-uploader")
              (package gn-uploader)
@@ -677,6 +792,7 @@ a @code{<genenetwork-configuration>} record."
                              (port port))))
              (wsgi-app-module "scripts.qcapp_wsgi:app")
              (workers 20)
+             (timeout 1200)
              (environment-variables
               (list (environment-variable
                      (name "UPLOADER_CONF")
@@ -695,8 +811,9 @@ a @code{<genenetwork-configuration>} record."
                               (source gn-uploader-conf)
                               (target source))
                              (file-system-mapping
-                              (source secrets)
-                              (target source))
+                              (source (dirname secrets))
+                              (target source)
+                              (writable? #t))
                              (file-system-mapping
                               (source data-directory)
                               (target source)
@@ -706,7 +823,15 @@ a @code{<genenetwork-configuration>} record."
                               (target source))
                              (file-system-mapping
                               (source gn-uploader-ca-bundle)
-                              (target source))))
+                              (target source))
+                             (file-system-mapping
+                              (source sessions-dir)
+                              (target source)
+                              (writable? #t))
+                             (file-system-mapping
+                              (source sqlite-databases-directory)
+                              (target source)
+                              (writable? #t))))
              (extra-cli-arguments
               (list "--log-level"
                     (string-upcase (symbol->string log-level)))))))))