# kgwas/params.py
## Raw UKBB (UK Biobank) data paths.
## If you have access to the data, point `_UKBB_ROOT` at your local copy;
## every path below is derived from it. Individual paths can still be
## overridden one by one if your layout differs.
##
## All values are plain `str` and directory paths keep their trailing '/',
## so code that builds file names by string concatenation keeps working.
_UKBB_ROOT = '/dfs/project/datasets/20220524-ukbiobank/data/'

# Directories (trailing slash is intentional).
cohort_data_path = _UKBB_ROOT + 'cohort/'
ukbb_data_path = _UKBB_ROOT + 'genetics/'

# Main tabular export (CSV file).
main_data_path = _UKBB_ROOT + 'ukb_main/ukb52124.csv'

# Files that live inside the genetics directory.
kinship_path = ukbb_data_path + 'ukb_rel_a79791_s488170.dat'
fam_path = ukbb_data_path + 'ukb_lmdb_fam.csv'
bim_path = ukbb_data_path + 'ukb_lmdb_bim.csv'

# NOTE(review): no extension or trailing slash here, so it is unclear from
# this file whether this is a file or a directory -- confirm against callers.
withdraw_path = _UKBB_ROOT + 'withdraw'

# Trait identifiers, kept in their original order as a plain list.
# Every entry starts with either 'UKB_460K.' or 'PASS_'.
# NOTE(review): presumably these are the trait names used with scDRS
# (going by the variable name) -- confirm against the code that consumes it.
scdrs_traits = [
    'UKB_460K.mental_NEUROTICISM',
    'PASS_FastingGlucose_Manning',
    'PASS_Lupus',
    'UKB_460K.biochemistry_HbA1c',
    'PASS_ADHD_Demontis2018',
    'UKB_460K.bmd_HEEL_TSCOREz',
    'UKB_460K.disease_HYPOTHYROIDISM_SELF_REP',
    'UKB_460K.blood_LYMPHOCYTE_COUNT',
    'PASS_Insomnia_Jansen2019',
    'UKB_460K.other_MORNINGPERSON',
    'UKB_460K.cov_SMOKING_STATUS',
    'UKB_460K.biochemistry_TotalBilirubin',
    'PASS_BIP_Stahl2019',
    'UKB_460K.biochemistry_HDLcholesterol',
    'PASS_UC_deLange2017',
    'UKB_460K.pigment_HAIR',
    'UKB_460K.body_HEIGHTz',
    'PASS_Worry_Nagel2018',
    'PASS_Type_2_Diabetes',
    'UKB_460K.body_BMIz',
    'UKB_460K.disease_HYPERTENSION_DIAGNOSED',
    'PASS_Primary_biliary_cirrhosis',
    'UKB_460K.blood_RED_COUNT',
    'UKB_460K.disease_CARDIOVASCULAR',
    'PASS_DrinksPerWeek_Liu2019',
    'PASS_SWB',
    'PASS_VerbalNumericReasoning_Davies2018',
    'UKB_460K.biochemistry_AlkalinePhosphatase',
    'UKB_460K.bp_DIASTOLICadjMEDz',
    'UKB_460K.disease_RESPIRATORY_ENT',
    'UKB_460K.biochemistry_Cholesterol',
    'PASS_Alzheimers_Jansen2019',
    'UKB_460K.repro_NumberChildrenEverBorn_Pooled',
    'UKB_460K.biochemistry_Triglycerides',
    'UKB_460K.body_BALDING1',
    'PASS_Coronary_Artery_Disease',
    'UKB_460K.blood_PLATELET_COUNT',
    'PASS_Multiple_sclerosis',
    'UKB_460K.disease_AID_ALL',
    'UKB_460K.repro_MENOPAUSE_AGE',
    'PASS_Type_1_Diabetes',
    'UKB_460K.lung_FVCzSMOKE',
    'UKB_460K.blood_EOSINOPHIL_COUNT',
    'UKB_460K.cancer_BREAST',
    'UKB_460K.repro_MENARCHE_AGE',
    'PASS_Intelligence_SavageJansen2018',
    'PASS_ReactionTime_Davies2018',
    'UKB_460K.biochemistry_SHBG',
    'UKB_460K.blood_WHITE_COUNT',
    'PASS_AtrialFibrillation_Nielsen2018',
    'UKB_460K.blood_MONOCYTE_COUNT',
    'UKB_460K.biochemistry_LDLdirect',
    'UKB_460K.biochemistry_TotalProtein',
    'UKB_460K.blood_MEAN_CORPUSCULAR_HEMOGLOBIN',
    'UKB_460K.cov_EDU_COLLEGE',
    'UKB_460K.body_WHRadjBMIz',
    'PASS_IBD_deLange2017',
    'PASS_SleepDuration_Dashti2019',
    'PASS_BIP_Mullins2021',
    'UKB_460K.cov_EDU_YEARS',
    'UKB_460K.bp_SYSTOLICadjMEDz',
    'UKB_460K.disease_ALLERGY_ECZEMA_DIAGNOSED',
    'UKB_460K.disease_ASTHMA_DIAGNOSED',
    'PASS_Schizophrenia_Pardinas2018',
    'PASS_Rheumatoid_Arthritis',
    'UKB_460K.lung_FEV1FVCzSMOKE',
    'PASS_Celiac',
    'UKB_460K.biochemistry_Glucose',
    'PASS_MDD_Howard2019',
    'PASS_GeneralRiskTolerance_KarlssonLinner2019',
    'PASS_CD_deLange2017',
    'UKB_460K.biochemistry_Testosterone_Male',
    'UKB_460K.blood_RBC_DISTRIB_WIDTH',
    'UKB_460K.impedance_BASAL_METABOLIC_RATEz',
    'UKB_460K.biochemistry_AlanineAminotransferase',
]