Trying under- and oversampling

This commit is contained in:
Tanushree Tunstall 2022-05-26 07:38:21 +01:00
parent 8f8306d948
commit 5779331981
5 changed files with 129 additions and 16 deletions

View file

@ -7,7 +7,7 @@ Created on Tue Mar 15 11:09:50 2022
"""
#%% Data
# Feature matrix: the columns of all_df_wtgt selected by
# numerical_FN + categorical_FN (presumably two lists of feature names — confirm).
X = all_df_wtgt[numerical_FN+categorical_FN]
# NOTE(review): this value of y is overwritten by the very next statement, so it
# has no effect as written. It looks like the pre-change line of the diff —
# confirm which target column is intended.
y = all_df_wtgt['mutation_class']
# Target actually in effect: the column of all_df_wtgt named by `drug`.
y = all_df_wtgt[drug]
#y = all_df_wtgt['dst_mode']
#%% variables
@ -17,9 +17,40 @@ mm_skf_scoresD = MultClassPipeSKFCV(input_df = X
, var_type = 'mixed'
, skf_cv = skf_cv)
# Tabulate the output of MultClassPipeSKFCV held in mm_skf_scoresD
# (presumably per-model cross-validation scores — confirm against the helper).
mm_skf_scores_df_all = pd.DataFrame(mm_skf_scoresD)
# Bare expression: only displays the table when the cell is run interactively.
mm_skf_scores_df_all
# filter(like=..., axis=0) keeps the rows whose index label contains the
# given substring, splitting the table into 'test_' rows and 'train_' rows.
mm_skf_scores_df_test = mm_skf_scores_df_all.filter(like='test_', axis=0)
mm_skf_scores_df_train = mm_skf_scores_df_all.filter(like='train_', axis=0) # helps to see if you trust the results
]
#%%
# Run MultClassPipeSKFCV on the X_sm / y_sm data
# (presumably the SMOTE-resampled set — confirm where X_sm is built).
mm_skf_scoresD2 = MultClassPipeSKFCV(
    input_df=X_sm,
    target=y_sm,
    var_type='mixed',
    skf_cv=skf_cv,
)
# Tabulate the returned scores, then keep only the rows whose index
# label contains 'test_'.
sm_all = pd.DataFrame(mm_skf_scoresD2)
sm_df_CT = sm_all.filter(axis=0, like='test_')
#%%
# Run MultClassPipeSKFCV on the X_ros / y_ros data
# (presumably the randomly oversampled set — confirm where X_ros is built).
mm_skf_scoresD3 = MultClassPipeSKFCV(
    input_df=X_ros,
    target=y_ros,
    var_type='mixed',
    skf_cv=skf_cv,
)
# Tabulate the returned scores, then keep only the rows whose index
# label contains 'test_'.
ros_all = pd.DataFrame(mm_skf_scoresD3)
ros_CT = ros_all.filter(axis=0, like='test_')
#%%
# Run MultClassPipeSKFCV on the X_rus / y_rus data
# (presumably the randomly undersampled set — confirm where X_rus is built).
mm_skf_scoresD4 = MultClassPipeSKFCV(
    input_df=X_rus,
    target=y_rus,
    var_type='mixed',
    skf_cv=skf_cv,
)
# Tabulate the returned scores, then keep only the rows whose index
# label contains 'test_'.
rus_all = pd.DataFrame(mm_skf_scoresD4)
rus_CT = rus_all.filter(axis=0, like='test_')
#%%
# Run MultClassPipeSKFCV on the X_enn / y_enn data
# (presumably the edited-nearest-neighbours undersampled set — confirm where X_enn is built).
mm_skf_scoresD5 = MultClassPipeSKFCV(
    input_df=X_enn,
    target=y_enn,
    var_type='mixed',
    skf_cv=skf_cv,
)
# Tabulate the returned scores, then keep only the rows whose index
# label contains 'test_'.
enn_all = pd.DataFrame(mm_skf_scoresD5)
enn_CT = enn_all.filter(axis=0, like='test_')