added FS to MultClfs.py and modified data for different splits for consistency
This commit is contained in:
parent
edb7aebd6a
commit
e2bc384155
12 changed files with 1585 additions and 994 deletions
|
@ -1,11 +1,13 @@
|
|||
=================================
|
||||
# Split: 70/30
|
||||
########################################################################
|
||||
|
||||
#70/30
|
||||
|
||||
########################################################################
|
||||
=-----------------------------------=
|
||||
# All features including AA index
|
||||
# Date: 22/06/2022
|
||||
# captures error: 2>$1
|
||||
# omitted drtype_labels
|
||||
=================================
|
||||
time ./run_7030.py -g pncA -d pyrazinamide 2>&1 | tee log_pnca_7030.txt
|
||||
# [WITH OR]
|
||||
=-----------------------------------=
|
||||
time ./run_7030.py -g pncA -d pyrazinamide 2>&1 | tee log_pnca_7030.txt #d
|
||||
time ./run_7030.py -g embB -d ethambutol 2>&1 | tee log_embb_7030.txt
|
||||
time ./run_7030.py -g katG -d isoniazid 2>&1 | tee log_katg_7030.txt
|
||||
time ./run_7030.py -g rpoB -d rifampicin 2>&1 | tee log_rpob_7030.txt
|
||||
|
@ -14,71 +16,155 @@ time ./run_7030.py -g alr -d cycloserine 2>&1 | tee log_alr_7030.txt
|
|||
|
||||
# alr: # ERROR, as expected, too few values!
|
||||
# gid: problems
|
||||
########################################################################
|
||||
|
||||
=================================
|
||||
# Split: 80/20
|
||||
=-----------------------------------=
|
||||
# All features including AA index
|
||||
# Date: 17/05/2022, 18:48
|
||||
# captures error: 2>$1
|
||||
=================================
|
||||
# [WITHOUT OR] **DONE
|
||||
#------------------------------------=
|
||||
time ./run_7030.py -g pncA -d pyrazinamide 2>&1 | tee log_pnca_7030_noOR.txt
|
||||
time ./run_7030.py -g embB -d ethambutol 2>&1 | tee log_embb_7030_noOR.txt
|
||||
time ./run_7030.py -g katG -d isoniazid 2>&1 | tee log_katg_7030_noOR.txt
|
||||
time ./run_7030.py -g rpoB -d rifampicin 2>&1 | tee log_rpob_7030_noOR.txt
|
||||
time ./run_7030.py -g gid -d streptomycin 2>&1 | tee log_gid_7030_noOR.txt
|
||||
time ./run_7030.py -g alr -d cycloserine 2>&1 | tee log_alr_7030_noOR.txt
|
||||
########################################################################
|
||||
|
||||
# 80/20
|
||||
|
||||
########################################################################
|
||||
|
||||
=================================
|
||||
# Split: scaling law
|
||||
=-----------------------------------=
|
||||
# All features including AA index
|
||||
# Date: 17/05/2022, 18:48
|
||||
# captures error: 2>$1
|
||||
=================================
|
||||
# [WITH OR]
|
||||
=-----------------------------------=
|
||||
time ./run_8020.py -g pncA -d pyrazinamide 2>&1 | tee log_pnca_8020.txt
|
||||
time ./run_8020.py -g embB -d ethambutol 2>&1 | tee log_embb_8020.txt
|
||||
time ./run_8020.py -g katG -d isoniazid 2>&1 | tee log_katg_8020.txt
|
||||
time ./run_8020.py -g rpoB -d rifampicin 2>&1 | tee log_rpob_8020.txt
|
||||
time ./run_8020.py -g gid -d streptomycin 2>&1 | tee log_gid_8020.txt
|
||||
time ./run_8020.py -g alr -d cycloserine 2>&1 | tee log_alr_8020.txt
|
||||
|
||||
|
||||
########################################################################
|
||||
=================================
|
||||
# Split: REVERSE training
|
||||
# imputed values: training set
|
||||
# actual values: blind set
|
||||
=-----------------------------------=
|
||||
# All features including AA index
|
||||
# Date: 18/05/2022
|
||||
# captures error: 2>$1
|
||||
=================================
|
||||
# [WITHOUT OR] **DONE
|
||||
real 0m1.099s
|
||||
user 0m1.308s
|
||||
sys 0m1.474s
|
||||
=-----------------------------------=
|
||||
time ./run_8020.py -g pncA -d pyrazinamide 2>&1 | tee log_pnca_8020_noOR.txt
|
||||
time ./run_8020.py -g embB -d ethambutol 2>&1 | tee log_embb_8020_noOR.txt
|
||||
time ./run_8020.py -g katG -d isoniazid 2>&1 | tee log_katg_8020_noOR.txt
|
||||
time ./run_8020.py -g rpoB -d rifampicin 2>&1 | tee log_rpob_8020_noOR.txt
|
||||
time ./run_8020.py -g gid -d streptomycin 2>&1 | tee log_gid_8020_noOR.txt
|
||||
time ./run_8020.py -g alr -d cycloserine 2>&1 | tee log_alr_8020_noOR.txt
|
||||
|
||||
########################################################################
|
||||
# COMPLETE Data: actual + na i.e imputed
|
||||
|
||||
# SL
|
||||
|
||||
########################################################################
|
||||
|
||||
=================================
|
||||
# Split: 70/30 [COMPLETE DATA]
|
||||
=-----------------------------------=
|
||||
# All features including AA index
|
||||
# Date: 18/05/2022
|
||||
# captures error: 2>$1
|
||||
=================================
|
||||
=-----------------------------------=
|
||||
|
||||
|
||||
########################################################################
|
||||
=================================
|
||||
# Split: 80/20 [COMPLETE DATA]
|
||||
|
||||
|
||||
|
||||
|
||||
=-----------------------------------=
|
||||
# All features including AA index
|
||||
# Date: 18/05/2022
|
||||
# captures error: 2>$1
|
||||
=================================
|
||||
# [WITHOUT OR]
|
||||
=-----------------------------------=
|
||||
time ./run_sl.py -g pncA -d pyrazinamide 2>&1 | tee log_pnca_sl_noOR.txt
|
||||
time ./run_sl.py -g embB -d ethambutol 2>&1 | tee log_embb_sl_noOR.txt
|
||||
time ./run_sl.py -g katG -d isoniazid 2>&1 | tee log_katg_sl_noOR.txt
|
||||
time ./run_sl.py -g rpoB -d rifampicin 2>&1 | tee log_rpob_sl_noOR.txt
|
||||
time ./run_sl.py -g gid -d streptomycin 2>&1 | tee log_gid_sl_noOR.txt
|
||||
time ./run_sl.py -g alr -d cycloserine 2>&1 | tee log_alr_sl_noOR.txt
|
||||
|
||||
=================================
|
||||
# Split: scaling law [COMPLETE DATA]
|
||||
########################################################################
|
||||
|
||||
|
||||
########################################################################
|
||||
########################################################################
|
||||
###################### COMPLETE DATA ##############################
|
||||
########################################################################
|
||||
########################################################################
|
||||
|
||||
|
||||
########################################################################
|
||||
|
||||
#70/30
|
||||
|
||||
########################################################################
|
||||
|
||||
|
||||
=-----------------------------------=
|
||||
# All features including AA index
|
||||
# Date: 18/05/2022
|
||||
# captures error: 2>$1
|
||||
=================================
|
||||
# [WITHOUT OR]
|
||||
#------------------------------------=
|
||||
time ./run_cd_7030.py -g pncA -d pyrazinamide 2>&1 | tee log_pnca_cd_7030_noOR.txt
|
||||
time ./run_cd_7030.py -g embB -d ethambutol 2>&1 | tee log_embb_cd_7030_noOR.txt
|
||||
time ./run_cd_7030.py -g katG -d isoniazid 2>&1 | tee log_katg_cd_7030_noOR.txt
|
||||
time ./run_cd_7030.py -g rpoB -d rifampicin 2>&1 | tee log_rpob_cd_7030_noOR.txt
|
||||
time ./run_cd_7030.py -g gid -d streptomycin 2>&1 | tee log_gid_cd_7030_noOR.txt
|
||||
time ./run_cd_7030.py -g alr -d cycloserine 2>&1 | tee log_alr_cd_7030_noOR.txt
|
||||
|
||||
|
||||
########################################################################
|
||||
|
||||
# 80/20
|
||||
|
||||
########################################################################
|
||||
|
||||
|
||||
|
||||
=-----------------------------------=
|
||||
# All features including AA index
|
||||
# [WITHOUT OR]
|
||||
#------------------------------------=
|
||||
time ./run_cd_8020.py -g pncA -d pyrazinamide 2>&1 | tee log_pnca_cd_8020_noOR.txt
|
||||
time ./run_cd_8020.py -g embB -d ethambutol 2>&1 | tee log_embb_cd_8020_noOR.txt
|
||||
time ./run_cd_8020.py -g katG -d isoniazid 2>&1 | tee log_katg_cd_8020_noOR.txt
|
||||
time ./run_cd_8020.py -g rpoB -d rifampicin 2>&1 | tee log_rpob_cd_8020_noOR.txt
|
||||
time ./run_cd_8020.py -g gid -d streptomycin 2>&1 | tee log_gid_cd_8020_noOR.txt
|
||||
time ./run_cd_8020.py -g alr -d cycloserine 2>&1 | tee log_alr_cd_8020_noOR.txt
|
||||
|
||||
########################################################################
|
||||
|
||||
# SL
|
||||
|
||||
########################################################################
|
||||
|
||||
|
||||
|
||||
=-----------------------------------=
|
||||
# All features including AA index
|
||||
# [WITHOUT OR]
|
||||
#------------------------------------=
|
||||
time ./run_cd_sl.py -g pncA -d pyrazinamide 2>&1 | tee log_pnca_cd_sl_noOR.txt
|
||||
time ./run_cd_sl.py -g embB -d ethambutol 2>&1 | tee log_embb_cd_sl_noOR.txt
|
||||
time ./run_cd_sl.py -g katG -d isoniazid 2>&1 | tee log_katg_cd_sl_noOR.txt
|
||||
time ./run_cd_sl.py -g rpoB -d rifampicin 2>&1 | tee log_rpob_cd_sl_noOR.txt
|
||||
time ./run_cd_sl.py -g gid -d streptomycin 2>&1 | tee log_gid_cd_sl_noOR.txt
|
||||
time ./run_cd_sl.py -g alr -d cycloserine 2>&1 | tee log_alr_cd_sl_noOR.txt
|
||||
|
||||
|
||||
|
||||
|
||||
########################################################################
|
||||
|
||||
########################################################################
|
||||
########################################################################
|
||||
###################### Feature Selection ##########################
|
||||
########################################################################
|
||||
########################################################################
|
||||
|
||||
# running feature selection
|
||||
# Split:70/30
|
||||
# 7030
|
||||
time ./run_FS.py -g pncA -d pyrazinamide 2>&1 | tee log_FS_pnca_7030.txt
|
||||
|
||||
real 338m26.705s
|
||||
user 1946m12.173s
|
||||
sys 189m40.122s
|
||||
|
||||
time ./run_FS_7030.py -g pncA -d pyrazinamide 2>&1 | tee log_FS_pnca_7030_noOR.txt
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue