87 lines
2.5 KiB
Python
87 lines
2.5 KiB
Python
#!/usr/bin/env python3
|
|
# -*- coding: utf-8 -*-
|
|
"""
|
|
Created on Mon Jun 20 13:05:23 2022
|
|
|
|
@author: tanu
|
|
"""
|
|
#==================
|
|
# Baseline models
|
|
#==================
|
|
cm_di2 = MultModelsCl_dissected(input_df = X
|
|
, target = y
|
|
, var_type = 'mixed'
|
|
, skf_cv = skf_cv
|
|
, blind_test_input_df = X_bts
|
|
, blind_test_target = y_bts
|
|
, add_cm = True
|
|
, add_yn = True)
|
|
|
|
baseline_all2 = pd.DataFrame(cm_di2)
|
|
baseline_all2 = baseline_all2.T
|
|
baseline_CTBT2 = baseline_all2.filter(regex = 'test_.*|bts_.*|TN|FP|FN|TP|.*_neg|.*_pos' , axis = 1)
|
|
|
|
#================
|
|
# Stability cols
|
|
#================
|
|
|
|
|
|
#================
|
|
# Affinity cols
|
|
#================
|
|
|
|
|
|
#================
|
|
# Residue level
|
|
#================
|
|
|
|
|
|
#================
|
|
# Genomics
|
|
# X_genomicFN
|
|
#================
|
|
feature_gp_name = 'genomics'
|
|
|
|
scores_mm_gn = MultModelsCl_dissected(input_df = X[X_genomicFN]
|
|
, target = y
|
|
, var_type = 'mixed'
|
|
, skf_cv = skf_cv
|
|
, blind_test_input_df = X_bts[X_genomicFN]
|
|
, blind_test_target = y_bts
|
|
, add_cm = True
|
|
, add_yn = True)
|
|
|
|
baseline_all_gn = pd.DataFrame(scores_mm_gn)
|
|
baseline_CTBT_gn = baseline_all_gn.filter(regex = '.*_time|test_.*|bts_.*|TN|FP|FN|TP|.*_neg|.*_pos' , axis = 0)
|
|
baseline_CTBT_gn['feature_group'] = feature_gp_name
|
|
|
|
|
|
|
|
baseline_CT = baseline_CTBT_gn.filter(regex = '.*_time|test_.*|TN|FP|FN|TP|.*_neg|.*_pos', axis = 0)
|
|
|
|
baseline_CT = baseline_CT.reset_index()
|
|
baseline_CT.rename(columns = {'index': 'original_index'}, inplace = True)
|
|
baseline_CT['score_type'] = baseline_CT['original_index']
|
|
baseline_CT['score_type'] = baseline_CT['score_type'].str.replace('test_*', '', regex = True)
|
|
baseline_CT['data_source'] = 'CT_score'
|
|
|
|
|
|
baseline_BT = baseline_CTBT_gn.filter(regex = 'bts_', axis = 0)
|
|
baseline_BT = baseline_BT.reset_index()
|
|
baseline_BT.rename(columns = {'index': 'original_index'}, inplace = True)
|
|
baseline_BT['score_type'] = baseline_BT['original_index']
|
|
baseline_BT['score_type'] = baseline_BT['score_type'].str.replace('bts_*', '', regex = True)
|
|
baseline_BT['data_source'] = 'BT_score'
|
|
|
|
# rpow bind
|
|
if all(baseline_CT.columns == baseline_BT.columns):
|
|
print('\nPASS:colnames match, proceeding to rowbind')
|
|
comb_df = pd.concat([baseline_BT,baseline_CT], axis = 0, ignore_index = True )
|
|
|
|
baseline_CT
|
|
baseline_CT
|
|
|
|
#================
|
|
# Evolution
|
|
#================
|
|
|