diff options
Diffstat (limited to 'utility/catalog_process.py')
-rw-r--r-- | utility/catalog_process.py | 10 |
1 files changed, 10 insertions, 0 deletions
"""Print GWAS Catalog associations whose reported trait mentions a keyword.

Reads a fixed set of columns from the GWAS Catalog associations TSV, keeps
the rows whose ``DISEASE/TRAIT`` text contains ``addiction``, and prints
the resulting DataFrame.
"""

import pandas as pd

# Columns loaded from the associations TSV (passed to ``usecols``).
col_list = ['PUBMEDID', 'DISEASE/TRAIT', 'REPORTED GENE(S)', 'MAPPED_GENE', 'MAPPED_TRAIT', 'P-VALUE', 'SNPS']

# Input file, expected in the current working directory.
CATALOG_PATH = 'gwas_catalog_v1.0.2-associations_e100_r2021-05-05.tsv'
# Column searched for the keyword, and the keyword itself.
TRAIT_COLUMN = 'DISEASE/TRAIT'
TRAIT_KEYWORD = 'addiction'


def filter_by_trait(datf, keyword=TRAIT_KEYWORD, column=TRAIT_COLUMN):
    """Return the rows of *datf* whose *column* text contains *keyword*.

    Args:
        datf: DataFrame holding a string column named *column*.
        keyword: Pattern to look for. It is handed to
            ``Series.str.contains`` with pandas' defaults, so the match is
            case-sensitive and the pattern is treated as a regular
            expression.
        column: Name of the column to search.

    Returns:
        A DataFrame with the matching rows; the original index labels are
        kept.

    Raises:
        KeyError: If *column* is not present in *datf*.
    """
    # na=False: rows with a missing trait count as "no match". Without it
    # the mask contains NaN and boolean indexing raises ValueError.
    mask = datf[column].str.contains(keyword, na=False)
    return datf[mask]


def main():
    """Load the selected catalog columns and print the matching rows."""
    datf = pd.read_csv(CATALOG_PATH, sep='\t', usecols=col_list)
    datf_sub = filter_by_trait(datf)
    print(datf_sub)
    # Debug aid: to check the dimensions of the complete catalog, read the
    # same file without ``usecols`` and print its ``.shape``.


if __name__ == '__main__':
    main()