aboutsummaryrefslogtreecommitdiff
path: root/gnqa/paper1_eval/src/run_human_datasets.sh
blob: 6f55d6d3c22f105856c14ab22727ecfca44da5b6 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
#!/bin/bash

#echo "Evaluating dataset of questions from domainexperts on the topic of general GN information."
#python3 ragas_fahamuRAG.py /home/shebes/code/GN-LLM-Hacking/gnqa_eval/src/data/datasets/human/dataset_domainexpert_general_1.json data/results/human/scores_de_gn_1.json 3
#sleep 60
#python3 ragas_fahamuRAG.py /home/shebes/code/GN-LLM-Hacking/gnqa_eval/src/data/datasets/human/dataset_domainexpert_general_2.json data/results/human/scores_de_gn_2.json 3
#sleep 60
#python3 ragas_fahamuRAG.py /home/shebes/code/GN-LLM-Hacking/gnqa_eval/src/data/datasets/human/dataset_domainexpert_general_3.json data/results/human/scores_de_gn_3.json 3
#sleep 60
#python3 ragas_fahamuRAG.py /home/shebes/code/GN-LLM-Hacking/gnqa_eval/src/data/datasets/human/dataset_domainexpert_general_4.json data/results/human/scores_de_gn_4.json 3
#sleep 60
#python3 ragas_fahamuRAG.py /home/shebes/code/GN-LLM-Hacking/gnqa_eval/src/data/datasets/human/dataset_domainexpert_general_5.json data/results/human/scores_de_gn_5.json 3
#sleep 60
#python3 ragas_fahamuRAG.py /home/shebes/code/GN-LLM-Hacking/gnqa_eval/src/data/datasets/human/dataset_domainexpert_general_6.json data/results/human/scores_de_gn_6.json 3
#sleep 60
#echo "Evaluating dataset of questions from domainexpert in the topic of aging"
#python3 ragas_fahamuRAG.py /home/shebes/code/GN-LLM-Hacking/gnqa_eval/src/data/datasets/human/dataset_domainexpert_aging_1.json data/results/human/scores_de_aging_1.json 3
#sleep 60
#python3 ragas_fahamuRAG.py /home/shebes/code/GN-LLM-Hacking/gnqa_eval/src/data/datasets/human/dataset_domainexpert_aging_2.json data/results/human/scores_de_aging_2.json 3
#sleep 60
#echo "Evaluating dataset of questions from domainexpert in the topic of diabetes"
#python3 ragas_fahamuRAG.py /home/shebes/code/GN-LLM-Hacking/gnqa_eval/src/data/datasets/human/dataset_domainexpert_diabetes_1.json data/results/human/scores_de_diabetes_1.json 3
#sleep 60
#python3 ragas_fahamuRAG.py /home/shebes/code/GN-LLM-Hacking/gnqa_eval/src/data/datasets/human/dataset_domainexpert_diabetes_2.json data/results/human/scores_de_diabetes_2.json 3
#sleep 60
#echo "Evaluating dataset of questions from citizenscientist in the topic of general"
#python3 ragas_fahamuRAG.py /home/shebes/code/GN-LLM-Hacking/gnqa_eval/src/data/datasets/human/dataset_citizenscientist_general_1.json data/results/human/scores_cs_gn_1.json 3
#python3 ragas_fahamuRAG.py /home/shebes/code/GN-LLM-Hacking/gnqa_eval/src/data/datasets/human/dataset_citizenscientist_general_2.json data/results/human/scores_cs_gn_2.json 3
#sleep 30
#python3 ragas_fahamuRAG.py /home/shebes/code/GN-LLM-Hacking/gnqa_eval/src/data/datasets/human/dataset_citizenscientist_general_3.json data/results/human/scores_cs_gn_3.json 3
#sleep 30
#python3 ragas_fahamuRAG.py /home/shebes/code/GN-LLM-Hacking/gnqa_eval/src/data/datasets/human/dataset_citizenscientist_general_4.json data/results/human/scores_cs_gn_4.json 3
#sleep 30
##python3 ragas_fahamuRAG.py /home/shebes/code/GN-LLM-Hacking/gnqa_eval/src/data/datasets/human/dataset_citizenscientist_general_5.json data/results/human/scores_cs_gn_5.json 3
##sleep 30
#python3 ragas_fahamuRAG.py /home/shebes/code/GN-LLM-Hacking/gnqa_eval/src/data/datasets/human/dataset_citizenscientist_general_6.json data/results/human/scores_cs_gn_6.json 3
#sleep 30
#python3 ragas_fahamuRAG.py /home/shebes/code/GN-LLM-Hacking/gnqa_eval/src/data/datasets/human/dataset_citizenscientist_general_7.json data/results/human/scores_cs_gn_7.json 3
#echo "Evaluating dataset of questions from citizenscientist in the topic of aging"
#python3 ragas_fahamuRAG.py /home/shebes/code/GN-LLM-Hacking/gnqa_eval/src/data/datasets/human/dataset_citizenscientist_aging_1.json data/results/human/scores_cs_aging_1.json 3
#sleep 30
#python3 ragas_fahamuRAG.py /home/shebes/code/GN-LLM-Hacking/gnqa_eval/src/data/datasets/human/dataset_citizenscientist_aging_2.json data/results/human/scores_cs_aging_2.json 3
#sleep 30
#python3 ragas_fahamuRAG.py /home/shebes/code/GN-LLM-Hacking/gnqa_eval/src/data/datasets/human/dataset_citizenscientist_aging_3.json data/results/human/scores_cs_aging_3.json 3
#sleep 30
#echo "Evaluating dataset of questions from citizenscientist in the topic of diabetes"
#python3 ragas_fahamuRAG.py /home/shebes/code/GN-LLM-Hacking/gnqa_eval/src/data/datasets/human/dataset_citizenscientist_diabetes_1.json data/results/human/scores_cs_diabetes_1.json 3
#sleep 30
#python3 ragas_fahamuRAG.py /home/shebes/code/GN-LLM-Hacking/gnqa_eval/src/data/datasets/human/dataset_citizenscientist_diabetes_2.json data/results/human/scores_cs_diabetes_2.json 3
#sleep 30
#python3 ragas_fahamuRAG.py /home/shebes/code/GN-LLM-Hacking/gnqa_eval/src/data/datasets/human/dataset_citizenscientist_diabetes_3.json data/results/human/scores_cs_diabetes_3.json 3
#sleep 30
#python3 ragas_fahamuRAG.py /home/shebes/code/GN-LLM-Hacking/gnqa_eval/src/data/datasets/human/dataset_citizenscientist_diabetes_4.json data/results/human/scores_cs_diabetes_4.json 3
#sleep 30

# Evaluate the gpt4o-generated citizen-scientist dataset on the general GN
# topic with ragas_fahamuRAG.py.
#
# ragas_fahamuRAG.py and the scores path are given relative to the current
# directory, so run this from the directory that holds that script.
# GNQA_DATASET_DIR may be exported to point at another copy of the datasets
# tree; when it is unset or empty the original hard-coded location is used.
dataset_dir="${GNQA_DATASET_DIR:-/home/shebes/code/GN-LLM-Hacking/gnqa_eval/src/data/datasets}"
dataset_file="${dataset_dir}/gpt4o/dataset_citizenscientist_gn_2.json"
# Presumably the file the scores are written to -- confirm in ragas_fahamuRAG.py.
scores_file="data/results/gpt4o/scores_cs_gn.json"

# The message names the general GN topic so that it matches the dataset file
# that is actually passed to the evaluator below.
echo "Evaluating dataset of questions from citizen scientist on the general GN topic, generated by gpt4o"
# The trailing 3 is forwarded unchanged; its meaning is defined by
# ragas_fahamuRAG.py, which is not visible from this script.
python3 ragas_fahamuRAG.py "${dataset_file}" "${scores_file}" 3
#sleep 60
#python3 ragas_fahamuRAG.py /home/shebes/code/GN-LLM-Hacking/gnqa_eval/src/data/datasets/gpt4o/dataset_citizenscientist_diabetes_2.json data/results/gpt4o/scores_cs_diabetes.json 3
#sleep 60
#python3 ragas_fahamuRAG.py /home/shebes/code/GN-LLM-Hacking/gnqa_eval/src/data/datasets/gpt4o/dataset_citizenscientist_diabetes_3.json data/results/gpt4o/scores_cs_diabetes.json 3
#sleep 60
#python3 ragas_fahamuRAG.py /home/shebes/code/GN-LLM-Hacking/gnqa_eval/src/data/datasets/gpt4o/dataset_citizenscientist_diabetes_4.json data/results/gpt4o/scores_cs_diabetes.json 3