# =============================================================================
# TRAIN_FILE = "data/20201126deepfm_feature_dmp_xgboost.csv"
# TRAIN_FILE = "data/20201126deepfm_feature_dmp_lasso.csv"
# TRAIN_FILE = "data/20201126deepfm_feature_dmp_lassoxgboost.csv"
# TRAIN_FILE = "data/20201126deepfm_feature_cor_xgboost.csv"
# TRAIN_FILE = "data/20201126deepfm_feature_cor_lasso.csv"
# TRAIN_FILE = "data/20201126deepfm_feature_cor_lassoxgboost.csv"
# TEST_FILE = "data/20201126deepfm_feature_dmp_xgboost_test.csv"
# TEST_FILE = "data/20201126deepfm_feature_dmp_lasso_test.csv"
# TEST_FILE = "data/20201126deepfm_feature_dmp_lassoxgboost_test.csv"
# TEST_FILE = "data/20201126deepfm_feature_cor_xgboost_test.csv"
# TEST_FILE = "data/20201126deepfm_feature_cor_lasso_test.csv"
# TEST_FILE = "data/20201126deepfm_feature_cor_lassoxgboost_test.csv"
# =============================================================================
# id3 (DMP lasso xgboost) variant whose file names contain "rm_cg05481257"
# =============================================================================
# TRAIN_FILE = "data/20201126deepfm_feature_rm_cg05481257_dmp_lassoxgboost.csv"
# TEST_FILE = "data/20201126deepfm_feature_rm_cg05481257_dmp_lassoxgboost_test.csv"
# =============================================================================
# Active input CSVs and output directory. The paths are relative; what they
# are resolved against is decided by the code that reads this file.
TRAIN_FILE = "data/20201126deepfm_feature_dmp_lassoxgboost.csv"
TEST_FILE = "data/20201126deepfm_feature_dmp_lassoxgboost_test.csv"
SUB_DIR = "output"
# Alternative test sets, kept for quick switching (replace the active
# TEST_FILE line above with one of these):
# TEST_FILE = "data/20201126deepfm_feature_dmp_lassoxgboost_4years_test.csv"
# TEST_FILE = "data/20201126deepfm_feature_cor_lassoxgboost_woman_test.csv"
# Run notes carried over verbatim from the original author:
#   50,25percentage,batch_size=100
#   6,4 years ;batch_size=100
# =============================================================================
# "cg00522231","cg05845376","cg07041999","cg17766026","cg24205914",
# "cg08101977","cg25755428","cg05363438","cg13352914","cg03233656",
# "cg05481257","cg03556243","cg16781992","cg10083824","cg08614290",
# "cg21429551","cg00045910","cg10556349","cg21024264","cg27401945",
# "cg06344265","cg20051875","cg23299445","cg00495303","cg11853697"
# =============================================================================
# Fixed seed and split count.
# NOTE(review): presumably the random-number seed and the number of
# cross-validation folds; confirm against the code that reads these values.
RANDOM_SEED = 2017
NUM_SPLITS = 3
# Column roles for the dataset dataframe.
# Categorical columns. The active entry is the id3 (DMP lasso xgboost)
# selection; the other selections are kept as comments for quick switching.
CATEGORICAL_COLS = [
    "Sulfonamides",
    # id1 = DMP xgboost:
    #   "HRX8"
    # id2 = DMP lasso:
    #   "Sulfonamides","Angiotensin_II_antagonists","chd","afx","HRX8",
    #   "atrial_enlargement","rheumatic","aortic_valve","rheumatoid_arthritis"
    # id4 = cor xgboost: (no columns listed in the original)
    # id5 = cor lasso:
    #   "Sulfonamides","rheumatic","aortic_valve"
    # id6 = cor lasso xgboost: (no columns listed in the original)
]
# Numeric columns. The active entries are the id3 (DMP lasso xgboost)
# selection: four non-"cg" columns followed by 25 "cg..." columns.
# The other selections (id1, id2, id4, id5, id6) are kept as comments at the
# end of the list for quick switching.
NUMERIC_COLS = [
    # id3 = DMP lasso xgboost (active)
    "AGE8",
    "BMI8",
    "CREAT8",
    "Albumin_urine",
    "cg00522231",
    "cg05845376",
    "cg07041999",
    "cg17766026",
    "cg24205914",
    "cg08101977",
    "cg25755428",
    "cg05363438",
    "cg13352914",
    "cg03233656",
    "cg05481257",
    "cg03556243",
    "cg16781992",
    "cg10083824",
    "cg08614290",
    "cg21429551",
    "cg00045910",
    "cg10556349",
    "cg21024264",
    "cg27401945",
    "cg06344265",
    "cg20051875",
    "cg23299445",
    "cg00495303",
    "cg11853697",
    # id1 = DMP xgboost:
    #   "AGE8","BMI8","Albumin_urine",
    #   "cg10501210","cg17280346","cg19025234","cg18319852","cg22367191",
    #   "cg24205914","cg24530234","cg25755428","cg01588224","cg03341469",
    #   "cg05365735","cg14975410","cg23450509","cg16781992","cg15421911",
    #   "cg23125993","cg26624398","cg27604145","cg12560772","cg08614290",
    #   "cg23447239","cg00285394","cg10210397","cg10556349","cg24892069",
    #   "cg27401945","cg06344265","cg12603632","cg01259782","cg05107535",
    #   "cg09547119","cg01346718"
    # id2 = DMP lasso:
    #   "AGE8","BMI8","CREAT8","Albumin_urine",
    #   "cg16986315","cg00522231","cg01227537","cg05845376","cg06883126",
    #   "cg19025234","cg07041999","cg17766026","cg24205914","cg21481937",
    #   "cg08101977","cg25755428","cg03341469","cg05363438","cg08702915",
    #   "cg13352914","cg03233656","cg05481257","cg12682972","cg25138327",
    #   "cg25552548","cg03556243","cg10098541","cg14975410","cg04573661",
    #   "cg16781992","cg07705913","cg11925729","cg15421911","cg06386482",
    #   "cg10083824","cg12560772","cg23049448","cg03453431","cg08614290",
    #   "cg14017689","cg17067544","cg21429551","cg21807944","cg00327383",
    #   "cg16196274","cg23180489","cg13741668","cg00045910","cg00639447",
    #   "cg10556349","cg21024264","cg27401945","cg06344265","cg10253640",
    #   "cg06021880","cg20051875","cg00893603","cg23299445","cg00876127",
    #   "cg01046070","cg05107535","cg05917111","cg00495303","cg00706441",
    #   "cg13672791","cg25481705","cg10339152","cg11853697","cg11861654",
    #   "cg18965930","cg20810198"
    # id4 = cor xgboost:
    #   "AGE8",
    #   "cg04836151","cg06976250","cg00028135","cg08360599","cg08980837",
    #   "cg11955727","cg12634591","cg15062216","cg17765025","cg17826763",
    #   "cg19906777","cg19916364","cg20346503","cg23111655","cg25256723",
    #   "cg03262554","cg06295856","cg08302325","cg08614290","cg12662162",
    #   "cg21349849","cg26472118","cg27476810","cg00495303","cg02992098",
    #   "cg04943661","cg12371587","cg22706883","cg26367719"
    # id5 = cor lasso:
    #   "AGE8","CREAT8","FASTING_BG8","Albumin_urine",
    #   "cg00209038","cg03835609","cg05120156","cg09760889","cg12974637",
    #   "cg15159605","cg17766026","cg20793089","cg21481937","cg24205914",
    #   "cg25754958","cg27232078","cg01627483","cg02302795","cg02493740",
    #   "cg03341469","cg03879180","cg11947712","cg11955727","cg11969526",
    #   "cg12634591","cg13380669","cg19453991","cg20702802","cg23542948",
    #   "cg25552548","cg00258873","cg01676795","cg08614290","cg09798536",
    #   "cg12743894","cg13830081","cg14473597","cg15493780","cg16196274",
    #   "cg17674495","cg20707765","cg24822529","cg04465730","cg05072413",
    #   "cg06021880","cg08809333","cg13932794","cg16538366","cg19841423",
    #   "cg20051875","cg27333018"
    # id6 = cor lasso xgboost:
    #   "AGE8","FASTING_BG8",
    #   "cg05120156","cg25754958","cg00209038","cg02302795","cg11947712",
    #   "cg03879180","cg11955727","cg11969526","cg12634591","cg19453991",
    #   "cg23542948","cg24822529","cg01676795","cg08614290","cg06021880",
    #   "cg13932794"
]
# Columns listed separately from the categorical and numeric lists.
# NOTE(review): presumably the row identifier and the label, skipped when
# building model features; confirm against the code that reads this list.
IGNORE_COLS = ["ID", "target"]