1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
|
#!/usr/bin/env bash
# genenetwork-machines --- Guix configuration for genenetwork machines
# Copyright © 2025 Munyoki Kilyungi <me@bonfacemunyoki.com>
#
# This file is part of genenetwork-machines.
#
# genenetwork-machines is free software: you can redistribute it
# and/or modify it under the terms of the GNU General Public License
# as published by the Free Software Foundation, either version 3 of
# the License, or (at your option) any later version.
#
# genenetwork-machines is distributed in the hope that it will be
# useful, but WITHOUT ANY WARRANTY; without even the implied warranty
# of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
# General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with genenetwork-machines. If not, see
# <https://www.gnu.org/licenses/>.

# Build and install genenetwork container on your local machine.
#
# Usage: the first argument selects what to do:
#   --init-container  create the shared host directories, copy the
#                     configuration files, clone the GeneNetwork projects
#                     and build the Guix system container
#   --init-sql        download the SQL dump and import it into MySQL
#   --init-rdf        generate the TTL files and load the RDF data
#   --init-xapian     build the Xapian index
#
# The interpreter is bash rather than sh because the script uses arrays,
# associative arrays, here-strings and `set -o pipefail`.  Strict mode is
# switched on with `set` (not with shebang flags) so that it is also active
# when the file is started as `bash <file>`.
set -euo pipefail

# Root directory on the host under which everything below is created.
BASE_DIR="${HOME:-/home/$USER}/genenetwork"

# Host directories that --init-container makes sure exist and are writable.
SYSTEM_DIRECTORIES=(
  "$BASE_DIR/var/log"
  "$BASE_DIR/var/genenetwork"
  "$BASE_DIR/etc/genenetwork/conf"
  "$BASE_DIR/etc/genenetwork"
  "$BASE_DIR/var/lib/redis"
  "$BASE_DIR/var/lib/virtuoso"
  "$BASE_DIR/var/lib/data"
  "$BASE_DIR/var/lib/xapian"
  "$BASE_DIR/var/genenetwork/genotype-files/genotype/json"
  "$BASE_DIR/var/lib/genenetwork-sqlite"
  "$BASE_DIR/var/lib/genenetwork-gnqa"
  "/tmp/local-container"
)

# Projects to clone, written as "<directory name>:<clone URL>".  Only the
# first ':' separates the two parts; the URL may contain further colons.
GN_PROJECTS=(
  "genenetwork2:git@github.com:genenetwork/genenetwork2"
  "genenetwork3:git@github.com:genenetwork/genenetwork3"
  "gn-transform-databases:https://git.genenetwork.org/gn-transform-databases/"
  "gn-auth:https://git.genenetwork.org/gn-auth"
  "gn-docs:https://git.genenetwork.org/gn-docs"
)

# File mappings: source -> destination
# Sources are relative paths, so they resolve against the directory the
# script is started from.
declare -A FILE_MAPPINGS=(
  ["etc/auth.db"]="$BASE_DIR/var/genenetwork/auth.db"
  ["etc/llm.db"]="$BASE_DIR/var/lib/genenetwork-sqlite/llm.db"
  ["etc/gn2-secrets.py"]="$BASE_DIR/etc/genenetwork/conf/gn2/secrets.py"
  ["etc/gn3-secrets.py"]="$BASE_DIR/etc/genenetwork/conf/gn3/secrets.py"
  ["etc/gn-auth-secrets.py"]="$BASE_DIR/etc/genenetwork/conf/gn-auth/secrets.py"
)

# System definition handed to `guix system container`, and the two places
# where the resulting launcher script gets symlinked.
CONTAINER_SCM="genenetwork-local-container.scm"
CONTAINER_BIN="/usr/local/bin/genenetwork-local-container"
GC_ROOT="/var/guix/gcroots/genenetwork-local-container"
#######################################
# Write one timestamped diagnostic line to stderr.
# Arguments:
#   $1    - severity label, printed verbatim (e.g. INFO, ERROR)
#   $2... - message words; they are joined into a single string
# Outputs:
#   "[YYYY-MM-DD HH:MM:SS] <severity>: <message>" on stderr
#######################################
log() {
  local severity="$1"
  shift
  printf '[%s] %s: %s\n' "$(date '+%Y-%m-%d %H:%M:%S')" "$severity" "$*" >&2
}
# Check dependencies: abort early when a required command is not on PATH.
for cmd in git guix sudo diff cp grep; do
  if ! command -v "$cmd" &>/dev/null; then
    log "ERROR" "Required command '$cmd' not found"
    exit 1
  fi
done

# Check for gn-bioinformatics channel.
# `guix describe` is run once and the matching lines are kept, so the same
# output is used both for the test and for the log message.  A plain
# if/else is used so that the failure branch exits this shell directly
# instead of relying on `set -e` to notice a failed subshell.
if gn_channel_lines=$(guix describe | grep gn-bioinformatics); then
  # Field 4 (space separated) is what the log line reports; presumably the
  # channel commit, given the leading indentation of `guix describe` output.
  log "INFO" "guix gn-bioinformatics $(cut -d ' ' -f 4 <<< "$gn_channel_lines")"
else
  log "ERROR" "Please make sure your current profile has gn-bioinformatics"
  exit 1
fi

# Validate HOME is set
if [ -z "${HOME:-}" ]; then
  log "ERROR" "HOME environment variable is not set"
  exit 1
fi
# --init-container: prepare the host and build the container.
# "${1:-}" keeps `set -u` from aborting with "unbound variable" when the
# script is started without any argument.
if [ "${1:-}" = "--init-container" ]; then
log "INFO" "Creating system directories..."
for dir in "${SYSTEM_DIRECTORIES[@]}"; do
  # Existing directory: only make sure the current user can write to it.
  if [ -d "$dir" ]; then
    if [ -w "$dir" ]; then
      log "DEBUG" "Directory exists and is writable: $dir"
    else
      log "WARNING" "Directory exists but is not writable: $dir. Making this writable"
      sudo chown -R "$USER" "$dir"
    fi
    continue
  fi

  # Attempt to create directory
  log "INFO" "Creating directory: $dir"

  # Walk up to the nearest ancestor that already exists and remember the
  # topmost component `mkdir -p` will have to create.  Testing only the
  # immediate parent is not enough: when the parent is missing it is never
  # "writable", so sudo would be used and every intermediate directory
  # (including $BASE_DIR) would end up owned by root.
  topmost_new="$dir"
  ancestor="$(dirname "$dir")"
  while [ ! -e "$ancestor" ]; do
    topmost_new="$ancestor"
    ancestor="$(dirname "$ancestor")"
  done

  if [ -w "$ancestor" ]; then
    # The existing ancestor is writable, try without sudo
    if ! mkdir -p "$dir"; then
      log "ERROR" "Failed to create directory without sudo: $dir"
      exit 1
    fi
  else
    # The existing ancestor requires root, use sudo
    if ! sudo mkdir -p "$dir"; then
      log "ERROR" "Failed to create directory with sudo: $dir"
      exit 1
    fi
    # Hand everything sudo just created (not only the leaf) to the current
    # user; only freshly created directories are below $topmost_new.
    if ! sudo chown -R "$USER:$USER" "$topmost_new"; then
      log "WARNING" "Failed to set ownership for: $dir"
    fi
  fi
done
# Check and copy configuration files
# Each FILE_MAPPINGS source is installed at its destination when the
# destination is missing or differs from the source.
log "INFO" "Checking and copying configuration files..."
for source_file in "${!FILE_MAPPINGS[@]}"; do
  target_file="${FILE_MAPPINGS[$source_file]}"
  log "INFO" "Processing $source_file -> $target_file"

  # A missing source is fatal.
  if [ ! -f "$source_file" ]; then
    log "ERROR" "Source file does not exist: $source_file"
    exit 1
  fi

  if [ -f "$target_file" ]; then
    # Destination present: show the diff and copy only when they differ.
    log "INFO" "Comparing $source_file with $target_file"
    if changes=$(diff -u "$target_file" "$source_file" 2>&1); then
      log "INFO" "Files $source_file and $target_file are identical"
      continue
    fi
    log "INFO" "Differences found between $source_file and $target_file:"
    printf '%s\n' "$changes" >&2
    log "INFO" "Copying $source_file to $target_file"
  else
    # Destination absent: create its directory first.
    log "INFO" "Destination file does not exist, copying $source_file to $target_file"
    mkdir -p "$(dirname "$target_file")"
  fi

  if ! cp "$source_file" "$target_file"; then
    log "ERROR" "Failed to copy $source_file to $target_file"
    exit 1
  fi
done
#######################################
# Decide from the on-disk layout whether a directory is a Git repository.
# A directory with a .git subdirectory must contain .git/HEAD and
# .git/refs; a directory without one counts as a bare repository when it
# has HEAD, refs/ and objects/ directly inside it.
# Arguments:
#   $1 - directory to inspect
# Outputs:
#   one DEBUG or ERROR line through log
# Returns:
#   0 when the layout matches, 1 otherwise
#######################################
is_git_repository() {
  local candidate="$1"
  local git_meta="$candidate/.git"

  # No .git directory: the only remaining possibility is a bare repository.
  if [ ! -d "$git_meta" ]; then
    if [ -f "$candidate/HEAD" ] && [ -d "$candidate/refs" ] && [ -d "$candidate/objects" ]; then
      log "DEBUG" "Detected bare Git repository: $candidate"
      return 0
    fi
    log "ERROR" "$candidate exists but is not a Git repository (neither standard nor bare)"
    return 1
  fi

  # A .git directory exists; it must hold both HEAD and refs/.
  if [ ! -f "$git_meta/HEAD" ] || [ ! -d "$git_meta/refs" ]; then
    log "ERROR" "Directory $candidate/.git exists but is not a valid Git repository"
    return 1
  fi

  log "DEBUG" "Detected standard Git repository: $candidate"
  return 0
}
# Clone GeneNetwork projects
# Every GN_PROJECTS entry is cloned into $BASE_DIR/<name> unless that
# directory already exists, in which case it must look like a Git repository.
log "INFO" "Cloning GeneNetwork projects..."
for project_entry in "${GN_PROJECTS[@]}"; do
  # Split "name:url" on the first ':' only; the rest of the entry, further
  # colons included, lands in repo_url.
  IFS=':' read -r project repo_url <<< "$project_entry"
  checkout="$BASE_DIR/$project"

  if [ -d "$checkout" ]; then
    log "DEBUG" "Directory exists, skipping clone: $checkout"
    if ! is_git_repository "$checkout"; then
      log "ERROR" "$checkout exists but is not a Git repository"
      exit 1
    fi
    continue
  fi

  log "INFO" "Cloning $project from $repo_url to $checkout"
  if ! git clone "$repo_url" "$checkout"; then
    log "ERROR" "Failed to clone $project"
    exit 1
  fi
done
# Make sure the flask_session directory exists inside the genenetwork2
# checkout.
FLASK_SESSION="$BASE_DIR/genenetwork2/flask_session"
log "INFO" "Checking FLASK_SESSION directory: $FLASK_SESSION"
if [ -d "$FLASK_SESSION" ]; then
  log "DEBUG" "FLASK_SESSION directory already exists: $FLASK_SESSION"
else
  log "INFO" "Creating FLASK_SESSION directory: $FLASK_SESSION"
  mkdir -p "$FLASK_SESSION" || {
    log "ERROR" "Failed to create FLASK_SESSION directory: $FLASK_SESSION"
    exit 1
  }
fi

# Verify container SCM file exists
# (CONTAINER_SCM is a relative path, so this looks in the current directory.)
[ -f "$CONTAINER_SCM" ] || {
  log "ERROR" "Container SCM file not found: $CONTAINER_SCM"
  exit 1
}
# Create Guix system container
log "INFO" "Creating Guix system container..."

# One --share=<host path>=<container path> option per directory that is
# passed to `guix system container`.
SHARE_OPTS=(
  "--share=$BASE_DIR/var/log=/var/log"
  "--share=$BASE_DIR/var/genenetwork=/var/genenetwork"
  "--share=$BASE_DIR/etc/genenetwork/conf=/etc/genenetwork/conf"
  "--share=$BASE_DIR/etc/genenetwork=/etc/genenetwork"
  "--share=$BASE_DIR/var/lib/redis=/var/lib/redis"
  "--share=$BASE_DIR/var/lib/virtuoso=/var/lib/virtuoso"
  "--share=$BASE_DIR/var/lib/data=/var/lib/data"
  "--share=$BASE_DIR/genenetwork2=/genenetwork2"
  "--share=$BASE_DIR/genenetwork3=/genenetwork3"
  "--share=$BASE_DIR/gn-auth=/gn-auth"
  "--share=$BASE_DIR/var/lib/xapian=/var/lib/xapian"
  "--share=$BASE_DIR/var/lib/genenetwork-sqlite=/var/lib/genenetwork-sqlite"
  "--share=$BASE_DIR/var/lib/genenetwork-gnqa=/var/lib/genenetwork-gnqa"
  "--share=/tmp/local-container=/tmp"
  "--share=$BASE_DIR/gn-docs=/var/lib/gn-docs"
  "--share=/run/mysqld=/run/mysqld"
)

# The command's stdout is captured as the path of the launcher script.
# Failure is reported explicitly; otherwise `set -e` would end the script
# here without any log line.
if ! container_script=$(guix system container \
  --network \
  --load-path=. \
  --verbosity=3 \
  "${SHARE_OPTS[@]}" \
  "$CONTAINER_SCM"); then
  log "ERROR" "Failed to build the Guix system container from $CONTAINER_SCM"
  exit 1
fi

# An empty result would make the symlinks created later point nowhere.
if [ -z "$container_script" ]; then
  log "ERROR" "guix system container did not print a container script path"
  exit 1
fi

# log expects the level as its first argument and the message after it.
log "DEBUG" "Container script: $container_script"
# Create symbolic links
# The built script is linked twice, at $CONTAINER_BIN and at $GC_ROOT;
# both links are created through sudo.
log "INFO" "Creating symbolic links..."
sudo ln -sf "$container_script" "$CONTAINER_BIN" || {
  log "ERROR" "Failed to create symbolic link: $CONTAINER_BIN"
  exit 1
}
sudo ln -sf "$container_script" "$GC_ROOT" || {
  log "ERROR" "Failed to create GC root link: $GC_ROOT"
  exit 1
}

# Closing summary, one log line per item.
for summary_line in \
  "Setup completed successfully!" \
  "Container script: $container_script" \
  "Run with: $CONTAINER_BIN" \
  "Email: test@development.user" \
  "Password: testpasswd"; do
  log "INFO" "$summary_line"
done
fi
# --init-sql: download the SQL dump, make sure the database user and the
# database exist, then import the dump.
# "${1:-}" keeps `set -u` from aborting when no argument is given.
if [ "${1:-}" = "--init-sql" ]; then
  # Configuration
  URL="https://files.genenetwork.org/database/db_webqtl_s-2025-02-18.sql.xz"
  FILE_NAME=$(basename "$URL")
  EXTRACTED_FILE="${FILE_NAME%.xz}"
  DB_USER="webqtlout"
  DB_PASSWORD="webqtlout"
  DB_HOST="localhost"
  DB_NAME="db_webqtl_local"
  MYSQL_ROOT_USER=""     # Change to your MySQL admin user if different
  MYSQL_ROOT_PASSWORD="" # Set this or leave empty to prompt

  # Check for required tools
  for cmd in wget xz mysql mktemp; do
    if ! command -v "$cmd" &> /dev/null; then
      log ERROR "Required command '$cmd' not found"
      exit 1
    fi
  done

  # Work in a private scratch directory instead of fixed names in /tmp: a
  # file left behind by an interrupted run can then no longer make
  # `xz -d` refuse to extract, and one EXIT trap cleans up on every path.
  if ! DOWNLOAD_DIR=$(mktemp -d "${TMPDIR:-/tmp}/genenetwork-sql.XXXXXX"); then
    log ERROR "Failed to create a temporary download directory"
    exit 1
  fi
  trap 'rm -rf -- "${DOWNLOAD_DIR:?}"' EXIT

  # Run the mysql client as the administrative user; all arguments are
  # passed through.  stderr is discarded as in the original commands
  # (presumably to hide the client's command-line password warning).
  # NOTE(review): the password is passed in argv and is therefore visible
  # to other local users via `ps`; consider an option file instead.
  run_mysql_admin() {
    mysql -h "$DB_HOST" -u "$MYSQL_ROOT_USER" -p"$MYSQL_ROOT_PASSWORD" "$@" 2>/dev/null
  }

  # Download the file
  log INFO "Downloading $URL to $DOWNLOAD_DIR/$FILE_NAME"
  if ! wget -O "$DOWNLOAD_DIR/$FILE_NAME" "$URL"; then
    log ERROR "Failed to download $URL"
    exit 1
  fi

  # Extract the .xz file (xz replaces the archive with the extracted file)
  log INFO "Extracting $DOWNLOAD_DIR/$FILE_NAME"
  if ! xz -d "$DOWNLOAD_DIR/$FILE_NAME"; then
    log ERROR "Failed to extract $DOWNLOAD_DIR/$FILE_NAME"
    exit 1
  fi

  # Prepare MySQL user and password credentials
  if [ -z "$MYSQL_ROOT_USER" ]; then
    log INFO "MySQL root user not set, prompting for input"
    # The user name is not secret, so it is echoed while typing.
    read -r -p "Enter MySQL user: " MYSQL_ROOT_USER
  fi
  if [ -z "$MYSQL_ROOT_PASSWORD" ]; then
    log INFO "MySQL root password not set, prompting for input"
    read -r -s -p "Enter MySQL root password: " MYSQL_ROOT_PASSWORD
    # -s also suppresses the newline typed by the user; finish the line.
    echo >&2
  fi

  # Check if DB user exists, create if not
  log INFO "Checking if MySQL user $DB_USER exists"
  # The query failure is handled here; under `set -e` with pipefail a
  # failing pipeline in a plain assignment would end the script silently.
  if ! USER_EXISTS=$(run_mysql_admin -e "SELECT EXISTS(SELECT 1 FROM mysql.user WHERE user = '$DB_USER' AND host = 'localhost') AS user_exists;" | grep -o '[0-1]$'); then
    log ERROR "Failed to query MySQL for user $DB_USER (check the admin credentials)"
    exit 1
  fi
  if [ "$USER_EXISTS" = "0" ]; then
    log INFO "Creating MySQL user $DB_USER"
    if ! run_mysql_admin -e "CREATE USER '$DB_USER'@'localhost' IDENTIFIED BY '$DB_PASSWORD'; GRANT ALL PRIVILEGES ON $DB_NAME.* TO '$DB_USER'@'localhost'; FLUSH PRIVILEGES;"; then
      log ERROR "Failed to create MySQL user $DB_USER"
      exit 1
    fi
  else
    log INFO "User $DB_USER already exists, ensuring privileges"
    if ! run_mysql_admin -e "GRANT ALL PRIVILEGES ON $DB_NAME.* TO '$DB_USER'@'localhost'; FLUSH PRIVILEGES;"; then
      log ERROR "Failed to update privileges for $DB_USER"
      exit 1
    fi
  fi

  # Create database if it doesn't exist
  log INFO "Ensuring database $DB_NAME exists"
  if ! run_mysql_admin -e "CREATE DATABASE IF NOT EXISTS $DB_NAME;"; then
    log ERROR "Failed to create or verify database $DB_NAME"
    exit 1
  fi

  # Install the SQL dump into the database (as the application user)
  log INFO "Importing $DOWNLOAD_DIR/$EXTRACTED_FILE into $DB_NAME"
  if ! mysql -h "$DB_HOST" -u "$DB_USER" -p"$DB_PASSWORD" "$DB_NAME" < "$DOWNLOAD_DIR/$EXTRACTED_FILE"; then
    log ERROR "Failed to import $DOWNLOAD_DIR/$EXTRACTED_FILE into $DB_NAME"
    exit 1
  fi

  # Clean up (the EXIT trap removes the scratch directory itself)
  log INFO "Removing $DOWNLOAD_DIR/$EXTRACTED_FILE"
  rm -f "$DOWNLOAD_DIR/$EXTRACTED_FILE"
  log INFO "Database import completed successfully"
  exit 0
fi
# --init-rdf: generate the TTL files and load the RDF data using the
# scripts in the gn-transform-databases checkout.
# "${1:-}" keeps `set -u` from aborting when no argument is given.
if [ "${1:-}" = "--init-rdf" ]; then
  # Check for required tools
  for cmd in guix; do
    if ! command -v "$cmd" &> /dev/null; then
      log ERROR "Required command '$cmd' not found"
      exit 1
    fi
  done
  log INFO "Please make sure your container is running for this to work"
  log INFO "This takes some time to run"

  # Check if directory exists and is accessible.  There is no enclosing
  # loop here, so no `continue` follows the check.
  rdf_data_dir="$BASE_DIR/var/lib/data"
  if [ -d "$rdf_data_dir" ]; then
    if [ -w "$rdf_data_dir" ]; then
      log "DEBUG" "Directory exists and is writable: $rdf_data_dir"
    else
      log "WARNING" "Directory exists but is not writable: $rdf_data_dir. Making this writable"
      sudo chown -R "$USER" "$rdf_data_dir"
    fi
  fi

  # etc/conn.scm is resolved against the directory the script was started
  # from, while the guile scripts are run from inside the checkout.
  curr_dir="$PWD"
  if ! cd "$BASE_DIR/gn-transform-databases"; then
    log ERROR "Cannot enter $BASE_DIR/gn-transform-databases; run --init-container first to clone it"
    exit 1
  fi
  guix shell -m "manifest.scm" -- guile "generate-ttl-files.scm" \
    --settings "$curr_dir/etc/conn.scm" --output "$rdf_data_dir"
  guix shell guile-dbi -m "manifest.scm" -- guile load-rdf.scm \
    "$curr_dir/etc/conn.scm"
  cd "$curr_dir"
  exit 0
fi
# --init-xapian: build the Xapian index in a scratch "build" directory and
# move the result into $BASE_DIR/var/lib/xapian.
# "${1:-}" keeps `set -u` from aborting when no argument is given.
if [ "${1:-}" = "--init-xapian" ]; then
  log INFO "Please make sure your container is running for this to work"
  log INFO "This takes some time to run"

  xapian_dir="$BASE_DIR/var/lib/xapian"
  xapian_build="$xapian_dir/build"

  # Check if directory exists and is accessible.  There is no enclosing
  # loop here, so no `continue` follows the check.
  if [ -d "$xapian_dir" ]; then
    if [ -w "$xapian_dir" ]; then
      log "DEBUG" "Directory exists and is writable: $xapian_dir"
    else
      log "WARNING" "Directory exists but is not writable: $xapian_dir. Making this writable"
      sudo chown -R "$USER" "$xapian_dir"
    fi
  fi

  # Always start from a clean build path, whatever a previous run left
  # there.  `:?` aborts instead of expanding to an empty path.
  rm -rf -- "${xapian_build:?}"

  env PYTHONPATH="$BASE_DIR/genenetwork3/" guix shell python-wrapper genenetwork3 \
    --share="$xapian_dir" -- \
    "$BASE_DIR/genenetwork3/scripts/index-genenetwork" create-xapian-index \
    "$xapian_build" \
    "mysql://webqtlout:webqtlout@localhost/db_webqtl_local?unix_socket=/run/mysqld/mysqld.sock&charset=utf8" \
    "http://localhost:7082/sparql"

  # The glob must stay outside the quotes, otherwise mv is handed the
  # literal name "build/*".  An unmatched glob stays literal too, so the
  # first element is checked before moving anything.
  built_files=("$xapian_build"/*)
  if [ ! -e "${built_files[0]}" ]; then
    log ERROR "No index files were produced in $xapian_build"
    exit 1
  fi
  mv -- "${built_files[@]}" "$xapian_dir/"
  rmdir "$xapian_build"

  log INFO "Please restart the container to set the correct permissions"
  exit 0
fi
|