more plot files
This commit is contained in:
parent
04253b961f
commit
3d817fde0c
29 changed files with 3252 additions and 760 deletions
363
scripts/plotting/plotting_thesis/gid/basic_barplots_gid.R
Normal file
363
scripts/plotting/plotting_thesis/gid/basic_barplots_gid.R
Normal file
|
@ -0,0 +1,363 @@
|
|||
#!/usr/bin/env Rscript
|
||||
#########################################################
|
||||
# TASK: Barplots
|
||||
# basic barplots with outcome
|
||||
# basic barplots with frequency of count of mutations
|
||||
#########################################################
|
||||
#=============
|
||||
# Data: Input
|
||||
#==============
|
||||
#source("~/git/LSHTM_analysis/config/gid.R")
|
||||
#source("~/git/LSHTM_analysis/scripts/plotting/get_plotting_dfs.R")
|
||||
#cat("\nSourced plotting cols as well:", length(plotting_cols))
|
||||
|
||||
####################################################
|
||||
class(merged_df3)
|
||||
|
||||
df3 = subset(merged_df3, select = -c(pos_count))
|
||||
|
||||
#=======
|
||||
# output
|
||||
#=======
|
||||
outdir_images = paste0("~/git/Writing/thesis/images/results/", tolower(gene), "/")
|
||||
cat("plots will output to:", outdir_images)
|
||||
|
||||
##########################################################
|
||||
# blue, red bp
|
||||
sts = 8
|
||||
lts = 8
|
||||
ats = 8
|
||||
als = 8
|
||||
ltis = 8
|
||||
geom_ls = 2.2
|
||||
|
||||
#pos_count
|
||||
subtitle_size = 8
|
||||
geom_ls_pc = 2.2
|
||||
leg_text_size = 8
|
||||
axis_text_size = 8
|
||||
axis_label_size = 8
|
||||
|
||||
###########################################################
|
||||
#------------------------------
|
||||
# plot default sizes
|
||||
#------------------------------
|
||||
#=========================
|
||||
# Affinity outcome
|
||||
# check this var: outcome_cols_affinity
|
||||
# get from preformatting or put in globals
|
||||
#==========================
|
||||
DistCutOff
|
||||
LigDist_colname # = "ligand_distance" # from globals
|
||||
ppi2Dist_colname
|
||||
naDist_colname
|
||||
|
||||
###########################################################
|
||||
# get plotting data within the distance
|
||||
df3_lig = df3[df3[[LigDist_colname]]<DistCutOff,]
|
||||
df3_ppi2 = df3[df3[[ppi2Dist_colname]]<DistCutOff,]
|
||||
df3_na = df3[df3[[naDist_colname]]<DistCutOff,]
|
||||
common_bp_title = paste0("Sites <", DistCutOff, angstroms_symbol)
|
||||
|
||||
#------------------------------
|
||||
# barplot for ligand affinity:
|
||||
# <10 Ang of ligand
|
||||
#------------------------------
|
||||
mLigP = stability_count_bp(plotdf = df3_lig
|
||||
, df_colname = "ligand_outcome"
|
||||
#, leg_title = "mCSM-lig"
|
||||
#, bp_plot_title = paste(common_bp_title, "ligand")
|
||||
, yaxis_title = "Number of nsSNPs"
|
||||
, leg_position = "none"
|
||||
, subtitle_text = "mCSM\nLig"
|
||||
, bar_fill_values = c("#F8766D", "#00BFC4")
|
||||
, subtitle_colour= "black"
|
||||
, sts = sts
|
||||
, lts = lts
|
||||
, ats = ats
|
||||
, als = als
|
||||
, ltis = ltis
|
||||
, geom_ls = geom_ls
|
||||
)
|
||||
mLigP
|
||||
#------------------------------
|
||||
# barplot for ligand affinity:
|
||||
# <10 Ang of ligand
|
||||
# mmCSM-lig: will be the same no. of sites but the effect will be different
|
||||
#------------------------------
|
||||
mmLigP = stability_count_bp(plotdf = df3_lig
|
||||
, df_colname = "mmcsm_lig_outcome"
|
||||
#, leg_title = "mmCSM-lig"
|
||||
#, label_categories = labels_mmlig
|
||||
#, bp_plot_title = paste(common_bp_title, "ligand")
|
||||
|
||||
, yaxis_title = ""
|
||||
, leg_position = "none"
|
||||
, subtitle_text = "mmCSM\nLig"
|
||||
, bar_fill_values = c("#F8766D", "#00BFC4")
|
||||
, subtitle_colour= "black"
|
||||
, sts = sts
|
||||
, lts = lts
|
||||
, ats = ats
|
||||
, als = als
|
||||
, ltis = ltis
|
||||
, geom_ls = geom_ls
|
||||
)
|
||||
mmLigP
|
||||
#------------------------------
|
||||
# barplot for ppi2 affinity
|
||||
# <10 Ang of interface
|
||||
#------------------------------
|
||||
if (tolower(gene)%in%geneL_ppi2){
|
||||
ppi2P = stability_count_bp(plotdf = df3_ppi2
|
||||
, df_colname = "mcsm_ppi2_outcome"
|
||||
#, leg_title = "mCSM-ppi2"
|
||||
#, label_categories = labels_ppi2
|
||||
#, bp_plot_title = paste(common_bp_title, "PP-interface")
|
||||
|
||||
, yaxis_title = "Number of nsSNPs"
|
||||
, leg_position = "none"
|
||||
, subtitle_text = "mCSM\nPPI2"
|
||||
, bar_fill_values = c("#F8766D", "#00BFC4")
|
||||
, subtitle_colour= "black"
|
||||
, sts = sts
|
||||
, lts = lts
|
||||
, ats = ats
|
||||
, als = als
|
||||
, ltis = ltis
|
||||
, geom_ls = geom_ls
|
||||
)
|
||||
ppi2P
|
||||
}
|
||||
#----------------------------
|
||||
# barplot for ppi2 affinity
|
||||
# <10 Ang of interface
|
||||
#------------------------------
|
||||
if (tolower(gene)%in%geneL_na){
|
||||
nca_distP = stability_count_bp(plotdf = df3_na
|
||||
, df_colname = "mcsm_na_outcome"
|
||||
#, leg_title = "mCSM-NA"
|
||||
#, label_categories =
|
||||
#, bp_plot_title = paste(common_bp_title, "Dist to NA")
|
||||
|
||||
, yaxis_title = "Number of nsSNPs"
|
||||
, leg_position = "none"
|
||||
, subtitle_text = "mCSM\nNA"
|
||||
, bar_fill_values = c("#F8766D", "#00BFC4")
|
||||
, subtitle_colour= "black"
|
||||
, sts = sts
|
||||
, lts = lts
|
||||
, ats = ats
|
||||
, als = als
|
||||
, ltis = ltis
|
||||
, geom_ls = geom_ls
|
||||
)
|
||||
nca_distP
|
||||
}
|
||||
|
||||
#####################################################################
|
||||
# ------------------------------
|
||||
# bp site site count: mCSM-lig
|
||||
# < 10 Ang ligand
|
||||
# ------------------------------
|
||||
common_bp_title = paste0("Sites <", DistCutOff, angstroms_symbol)
|
||||
|
||||
posC_lig = site_snp_count_bp(plotdf = df3_lig
|
||||
, df_colname = "position"
|
||||
, xaxis_title = "Number of nsSNPs"
|
||||
, yaxis_title = "Number of Sites"
|
||||
, subtitle_colour = "chocolate4"
|
||||
, subtitle_text = ""
|
||||
, subtitle_size = subtitle_size
|
||||
, geom_ls = geom_ls_pc
|
||||
, leg_text_size = leg_text_size
|
||||
, axis_text_size = axis_text_size
|
||||
, axis_label_size = axis_label_size)
|
||||
|
||||
posC_lig
|
||||
#------------------------------
|
||||
# bp site site count: ppi2
|
||||
# < 10 Ang interface
|
||||
#------------------------------
|
||||
if (tolower(gene)%in%geneL_ppi2){
|
||||
posC_ppi2 = site_snp_count_bp(plotdf = df3_ppi2
|
||||
, df_colname = "position"
|
||||
, xaxis_title = "Number of nsSNPs"
|
||||
, yaxis_title = "Number of Sites"
|
||||
, subtitle_colour = "chocolate4"
|
||||
, subtitle_text = ""
|
||||
, subtitle_size = subtitle_size
|
||||
, geom_ls = geom_ls_pc
|
||||
, leg_text_size = leg_text_size
|
||||
, axis_text_size = axis_text_size
|
||||
, axis_label_size = axis_label_size)
|
||||
posC_ppi2
|
||||
}
|
||||
|
||||
#------------------------------
|
||||
# bp site site count: NCA dist
|
||||
# < 10 Ang nca
|
||||
#------------------------------
|
||||
if (tolower(gene)%in%geneL_na){
|
||||
posC_nca = site_snp_count_bp(plotdf = df3_na
|
||||
, df_colname = "position"
|
||||
, xaxis_title = "Number of nsSNPs"
|
||||
, yaxis_title = "Number of Sites"
|
||||
, subtitle_colour = "chocolate4"
|
||||
, subtitle_text = ""
|
||||
, subtitle_size = subtitle_size
|
||||
, geom_ls = geom_ls_pc
|
||||
, leg_text_size = leg_text_size
|
||||
, axis_text_size = axis_text_size
|
||||
, axis_label_size = axis_label_size)
|
||||
posC_nca
|
||||
}
|
||||
#===============================================================
|
||||
#------------------------------
|
||||
# bp site site count: ALL
|
||||
# <10 Ang ligand
|
||||
#------------------------------
|
||||
posC_all = site_snp_count_bp(plotdf = df3
|
||||
, df_colname = "position"
|
||||
, xaxis_title = "Number of nsSNPs"
|
||||
, yaxis_title = "Number of Sites"
|
||||
, subtitle_colour = "chocolate4"
|
||||
, subtitle_text = "All mutations sites"
|
||||
, subtitle_size = subtitle_size
|
||||
, geom_ls = geom_ls_pc
|
||||
, leg_text_size = leg_text_size
|
||||
, axis_text_size = axis_text_size
|
||||
, axis_label_size = axis_label_size)
|
||||
posC_all
|
||||
##################################################################
|
||||
consurfP = stability_count_bp(plotdf = df3
|
||||
, df_colname = "consurf_outcome"
|
||||
#, leg_title = "ConSurf"
|
||||
#, label_categories = labels_consurf
|
||||
, yaxis_title = "Number of nsSNPs"
|
||||
, leg_position = "top"
|
||||
, subtitle_text = "ConSurf"
|
||||
, bar_fill_values = consurf_colours # from globals
|
||||
, subtitle_colour= "black"
|
||||
, sts = sts
|
||||
, lts = lts
|
||||
, ats = ats
|
||||
, als = als
|
||||
, ltis = ltis
|
||||
, geom_ls = geom_ls)
|
||||
|
||||
consurfP
|
||||
|
||||
##############################################################
|
||||
sts_so = 10
|
||||
lts_so = 10
|
||||
ats_so = 10
|
||||
als_so = 10
|
||||
ltis_so = 10
|
||||
geom_ls_so = 2.5
|
||||
#===================
|
||||
# Stability
|
||||
#===================
|
||||
# duetP
|
||||
duetP = stability_count_bp(plotdf = df3
|
||||
, df_colname = "duet_outcome"
|
||||
, leg_title = "mCSM-DUET"
|
||||
#, label_categories = labels_duet
|
||||
, yaxis_title = "Number of nsSNPs"
|
||||
, leg_position = "none"
|
||||
, subtitle_text = "mCSM-DUET"
|
||||
, bar_fill_values = c("#F8766D", "#00BFC4")
|
||||
, subtitle_colour= "black"
|
||||
, sts = sts_so
|
||||
, lts = lts_so
|
||||
, ats = ats_so
|
||||
, als = als_so
|
||||
, ltis = ltis_so
|
||||
, geom_ls = geom_ls_so)
|
||||
duetP
|
||||
|
||||
# foldx
|
||||
foldxP = stability_count_bp(plotdf = df3
|
||||
, df_colname = "foldx_outcome"
|
||||
#, leg_title = "FoldX"
|
||||
#, label_categories = labels_foldx
|
||||
, yaxis_title = ""
|
||||
, leg_position = "none"
|
||||
, subtitle_text = "FoldX"
|
||||
, bar_fill_values = c("#F8766D", "#00BFC4")
|
||||
, sts = sts_so
|
||||
, lts = lts_so
|
||||
, ats = ats_so
|
||||
, als = als_so
|
||||
, ltis = ltis_so
|
||||
, geom_ls = geom_ls_so)
|
||||
foldxP
|
||||
|
||||
# deepddg
|
||||
deepddgP = stability_count_bp(plotdf = df3
|
||||
, df_colname = "deepddg_outcome"
|
||||
#, leg_title = "DeepDDG"
|
||||
#, label_categories = labels_deepddg
|
||||
, yaxis_title = ""
|
||||
, leg_position = "none"
|
||||
, subtitle_text = "DeepDDG"
|
||||
, bar_fill_values = c("#F8766D", "#00BFC4")
|
||||
, sts = sts_so
|
||||
, lts = lts_so
|
||||
, ats = ats_so
|
||||
, als = als_so
|
||||
, ltis = ltis_so
|
||||
, geom_ls = geom_ls_so)
|
||||
deepddgP
|
||||
|
||||
# deepddg
|
||||
dynamut2P = stability_count_bp(plotdf = df3
|
||||
, df_colname = "ddg_dynamut2_outcome"
|
||||
#, leg_title = "Dynamut2"
|
||||
#, label_categories = labels_ddg_dynamut2_outcome
|
||||
, yaxis_title = ""
|
||||
, leg_position = "none"
|
||||
, subtitle_text = "Dynamut2"
|
||||
, bar_fill_values = c("#F8766D", "#00BFC4")
|
||||
, sts = sts_so
|
||||
, lts = lts_so
|
||||
, ats = ats_so
|
||||
, als = als_so
|
||||
, ltis = ltis_so
|
||||
, geom_ls = geom_ls_so)
|
||||
dynamut2P
|
||||
|
||||
# provean
|
||||
proveanP = stability_count_bp(plotdf = df3
|
||||
, df_colname = "provean_outcome"
|
||||
#, leg_title = "PROVEAN"
|
||||
#, label_categories = labels_provean
|
||||
, yaxis_title = "Number of nsSNPs"
|
||||
, leg_position = "none" # top
|
||||
, subtitle_text = "PROVEAN"
|
||||
, bar_fill_values = c("#D01C8B", "#F1B6DA") # light pink and deep
|
||||
, sts = sts_so
|
||||
, lts = lts_so
|
||||
, ats = ats_so
|
||||
, als = als_so
|
||||
, ltis = ltis_so
|
||||
, geom_ls = geom_ls_so)
|
||||
proveanP
|
||||
|
||||
# snap2
|
||||
snap2P = stability_count_bp(plotdf = df3
|
||||
, df_colname = "snap2_outcome"
|
||||
#, leg_title = "SNAP2"
|
||||
#, label_categories = labels_snap2
|
||||
, yaxis_title = ""
|
||||
, leg_position = "none" # top
|
||||
, subtitle_text = "SNAP2"
|
||||
, bar_fill_values = c("#D01C8B", "#F1B6DA") # light pink and deep
|
||||
, sts = sts_so
|
||||
, lts = lts_so
|
||||
, ats = ats_so
|
||||
, als = als_so
|
||||
, ltis = ltis_so
|
||||
, geom_ls = geom_ls_so)
|
||||
snap2P
|
||||
#####################################################################################
|
|
@ -1,17 +1,38 @@
|
|||
duetP
|
||||
foldxP
|
||||
deepddgP
|
||||
dynamut2P
|
||||
proveanP
|
||||
snap2P
|
||||
#=============
|
||||
# Data: Input
|
||||
#==============
|
||||
source("~/git/LSHTM_analysis/config/gid.R")
|
||||
source("~/git/LSHTM_analysis/scripts/plotting/get_plotting_dfs.R")
|
||||
#cat("\nSourced plotting cols as well:", length(plotting_cols))
|
||||
|
||||
source("/home/tanu/git/LSHTM_analysis/scripts/plotting/plotting_thesis/gid/basic_barplots_gid.R")
|
||||
source("/home/tanu/git/LSHTM_analysis/scripts/plotting/plotting_thesis/gid/pe_sens_site_count_gid.R")
|
||||
|
||||
|
||||
if ( tolower(gene)%in%c("gid") ){
|
||||
cat("\nPlots available for layout are:")
|
||||
|
||||
duetP
|
||||
foldxP
|
||||
deepddgP
|
||||
dynamut2P
|
||||
proveanP
|
||||
snap2P
|
||||
|
||||
mLigP
|
||||
mmLigP
|
||||
posC_lig
|
||||
|
||||
nca_distP
|
||||
posC_nca
|
||||
|
||||
peP2
|
||||
sens_siteP
|
||||
peP # not used
|
||||
sensP # not used
|
||||
}
|
||||
|
||||
|
||||
mLigP
|
||||
mmLigP
|
||||
posC_lig
|
||||
ppi2P
|
||||
posC_nca
|
||||
peP
|
||||
sensP
|
||||
#========================
|
||||
# Common title settings
|
||||
#=========================
|
||||
|
@ -118,9 +139,8 @@ dev.off()
|
|||
|
||||
#################################################################
|
||||
#=======================================
|
||||
# Affinity barplots: COMBINE ALL three
|
||||
# Affinity barplots: COMBINE ALL four
|
||||
#========================================
|
||||
|
||||
ligT = paste0(common_bp_title, " ligand")
|
||||
lig_affT = ggdraw() +
|
||||
draw_label(
|
||||
|
@ -136,7 +156,7 @@ p1 = cowplot::plot_grid(cowplot::plot_grid(lig_affT
|
|||
, nrow=2),
|
||||
cowplot::plot_grid(mLigP, mmLigP, posC_lig
|
||||
, nrow = 1
|
||||
, rel_widths = c(1,1,1.8)
|
||||
, rel_widths = c(1,0.65,1.8)
|
||||
, align = "h"),
|
||||
nrow = 2,
|
||||
rel_heights = c(1,8)
|
||||
|
@ -144,7 +164,7 @@ p1 = cowplot::plot_grid(cowplot::plot_grid(lig_affT
|
|||
)
|
||||
p1
|
||||
###########################################################
|
||||
ncaT = paste0(common_bp_title, " Dist-NA")
|
||||
ncaT = paste0(common_bp_title, " Nucleic Acid")
|
||||
nca_affT = ggdraw() +
|
||||
draw_label(
|
||||
ncaT,
|
||||
|
@ -159,7 +179,7 @@ p2 = cowplot::plot_grid(cowplot::plot_grid(nca_affT
|
|||
, nrow=2),
|
||||
cowplot::plot_grid(nca_distP, posC_nca
|
||||
, nrow = 1
|
||||
, rel_widths = c(1.2,1.8)
|
||||
, rel_widths = c(1,1.8)
|
||||
, align = "h"),
|
||||
nrow = 2,
|
||||
rel_heights = c(1,8)
|
||||
|
@ -176,7 +196,7 @@ peT_allT = ggdraw() +
|
|||
size = 8
|
||||
)
|
||||
|
||||
p3 = cowplot::plot_grid(cowplot::plot_grid(peT_allT, nrow = 2
|
||||
p4 = cowplot::plot_grid(cowplot::plot_grid(peT_allT, nrow = 2
|
||||
, rel_widths = c(1,3),axis = "lr"),
|
||||
cowplot::plot_grid(
|
||||
peP2, posC_all,
|
||||
|
@ -185,13 +205,12 @@ p3 = cowplot::plot_grid(cowplot::plot_grid(peT_allT, nrow = 2
|
|||
align = "v",
|
||||
axis = "lr",
|
||||
rel_heights = c(1,8)
|
||||
),
|
||||
),
|
||||
rel_heights = c(1,18),
|
||||
nrow = 2,axis = "lr")
|
||||
p3
|
||||
#===============
|
||||
# Final combine
|
||||
#===============
|
||||
p4
|
||||
|
||||
#### Combine p1+p2+p4 ####
|
||||
w = 11.79
|
||||
h = 3.5
|
||||
mut_impact_CLP = paste0(outdir_images
|
||||
|
@ -202,21 +221,46 @@ mut_impact_CLP = paste0(outdir_images
|
|||
print(paste0("plot filename:", mut_impact_CLP))
|
||||
png(mut_impact_CLP, units = "in", width = w, height = h, res = 300 )
|
||||
|
||||
cowplot::plot_grid(p1, p2
|
||||
#, p3
|
||||
, nrow = 1
|
||||
, labels = "AUTO"
|
||||
, label_size = 12
|
||||
, rel_widths = c(3,2,2)
|
||||
cowplot::plot_grid(p1,
|
||||
p2,
|
||||
p4,
|
||||
nrow = 1,
|
||||
labels = "AUTO",
|
||||
label_size = 12,
|
||||
rel_widths = c(2.5,2,2)
|
||||
#, rel_heights = c(1)
|
||||
)
|
||||
)
|
||||
|
||||
dev.off()
|
||||
w = 11.79
|
||||
h = 3.5
|
||||
mut_impact_CLP = paste0(outdir_images
|
||||
,tolower(gene)
|
||||
,"_mut_impactCLP.png")
|
||||
|
||||
#svg(affP, width = 20, height = 5.5)
|
||||
print(paste0("plot filename:", mut_impact_CLP))
|
||||
png(mut_impact_CLP, units = "in", width = w, height = h, res = 300 )
|
||||
|
||||
cowplot::plot_grid(p1,
|
||||
p2,
|
||||
p4,
|
||||
nrow = 1,
|
||||
labels = "AUTO",
|
||||
label_size = 12,
|
||||
rel_widths = c(2.5,2,2)
|
||||
#, rel_heights = c(1)
|
||||
)
|
||||
|
||||
dev.off()
|
||||
|
||||
|
||||
|
||||
##################################################
|
||||
sensP
|
||||
consurfP
|
||||
#=================
|
||||
# Combine sensitivity + ConSurf
|
||||
#### Combine sensitivity + ConSurf ####
|
||||
# or ConSurf
|
||||
#=================
|
||||
w = 3
|
||||
|
@ -263,7 +307,7 @@ sens_siteCLP = paste0(outdir_images
|
|||
,"_sens_siteC_tile.png")
|
||||
|
||||
print(paste0("plot filename:", sens_siteCLP))
|
||||
png(sens_siteCLP, units = "in", width = 1, height = 1, res = 300 )
|
||||
png(sens_siteCLP, units = "in", width = 1.2, height = 1, res = 300 )
|
||||
sens_siteP
|
||||
dev.off()
|
||||
|
|
@ -1,320 +0,0 @@
|
|||
#################
|
||||
# Numbers
|
||||
##################
|
||||
#all_dm_om_df = dm_om_wf_lf_data(df = merged_df3, gene = gene)
|
||||
all_dm_om_df = dm_om_wf_lf_data(df = df3, gene = gene)
|
||||
|
||||
# lf_duet = all_dm_om_df[['lf_duet']]
|
||||
# table(lf_duet$param_type)
|
||||
################################################################
|
||||
|
||||
#======================
|
||||
# Data: Dist+Genomics
|
||||
#======================
|
||||
lf_dist_genP = all_dm_om_df[['lf_dist_gen']]
|
||||
wf_dist_genP = all_dm_om_df[['wf_dist_gen']]
|
||||
|
||||
levels(lf_dist_genP$param_type)
|
||||
#lf_dist_genP$param_type <- factor(lf_dist_genP$param_type, levels=c("Log10(MAF)", "Lig Dist(Å)", "PPI Dist(Å)"))
|
||||
table(lf_dist_genP$param_type)
|
||||
|
||||
genomics_param = c("Log10(MAF)")
|
||||
|
||||
dist_genP = lf_bp2(lf_dist_genP
|
||||
#, p_title
|
||||
, violin_quantiles = c(0.5), monochrome = F)
|
||||
dist_genP
|
||||
#-------------------
|
||||
# Genomics data plot
|
||||
#-------------------
|
||||
genomics_dataP = lf_dist_genP[lf_dist_genP$param_type%in%genomics_param,]
|
||||
genomics_dataP$param_type = factor(genomics_dataP$param_type)
|
||||
table(genomics_dataP$param_type)
|
||||
|
||||
genomicsP = lf_bp2(genomics_dataP
|
||||
#, p_title = ""
|
||||
, violin_quantiles = c(0.5), monochrome = F)
|
||||
|
||||
genomicsP
|
||||
|
||||
#check
|
||||
wilcox.test(wf_dist_genP$`Log10(MAF)`[wf_dist_genP$mutation_info_labels=="R"]
|
||||
, wf_dist_genP$`Log10(MAF)`[wf_dist_genP$mutation_info_labels=="S"], paired = FALSE)
|
||||
|
||||
tapply(wf_dist_genP$`Log10(MAF)`, wf_dist_genP$mutation_info_labels, summary)
|
||||
|
||||
#-------------------
|
||||
# Distance data plot:
|
||||
#--------------------
|
||||
# not genomics
|
||||
dist_dataP = lf_dist_genP[!lf_dist_genP$param_type%in%genomics_param,]
|
||||
dist_dataP$param_type = factor(dist_dataP$param_type)
|
||||
table(dist_dataP$param_type)
|
||||
levels(dist_dataP$param_type)
|
||||
# relevel factor to control ordering of appearance of plot
|
||||
dist_dataP$param_type <-relevel(dist_dataP$param_type, "Lig Dist(Å)" )
|
||||
table(dist_dataP$param_type)
|
||||
levels(dist_dataP$param_type)
|
||||
|
||||
distanceP = lf_bp2(dist_dataP
|
||||
#, p_title = ""
|
||||
, violin_quantiles = c(0.5), monochrome = F)
|
||||
|
||||
distanceP
|
||||
|
||||
# check
|
||||
wilcox.test(wf_dist_genP$`PPI Dist(Å)`[wf_dist_genP$mutation_info_labels=="R"]
|
||||
, wf_dist_genP$`PPI Dist(Å)`[wf_dist_genP$mutation_info_labels=="S"], paired = FALSE)
|
||||
|
||||
wilcox.test(wf_dist_genP$`Lig Dist(Å)`[wf_dist_genP$mutation_info_labels=="R"]
|
||||
, wf_dist_genP$`Lig Dist(Å)`[wf_dist_genP$mutation_info_labels=="S"], paired = FALSE)
|
||||
|
||||
|
||||
wilcox.test(wf_dist_genP$`NA Dist(Å)`[wf_dist_genP$mutation_info_labels=="R"]
|
||||
, wf_dist_genP$`NA Dist(Å)`[wf_dist_genP$mutation_info_labels=="S"], paired = FALSE)
|
||||
|
||||
tapply(wf_dist_genP$`PPI Dist(Å)`, wf_dist_genP$mutation_info_labels, summary)
|
||||
|
||||
tapply(wf_dist_genP$`Lig Dist(Å)`, wf_dist_genP$mutation_info_labels, summary)
|
||||
|
||||
|
||||
#-------------------
|
||||
# Distance data plot: LigDist
|
||||
#--------------------
|
||||
levels(dist_dataP$param_type)[[1]]
|
||||
#Lig Dist(Å), PPI Dist(Å)
|
||||
dist_data_lig = dist_dataP[dist_dataP$param_type%in%c(levels(dist_dataP$param_type)[[1]]),]
|
||||
dist_data_lig$param_type = factor(dist_data_lig$param_type)
|
||||
table(dist_data_lig$param_type)
|
||||
levels(dist_data_lig$param_type)
|
||||
distanceP_lig = lf_bp2(dist_data_lig
|
||||
#, p_title = ""
|
||||
, violin_quantiles = c(0.5), monochrome = F)
|
||||
|
||||
distanceP_lig
|
||||
|
||||
if (tolower(gene)%in%geneL_ppi2){
|
||||
#-------------------
|
||||
# Distance data plot: LigDist
|
||||
#--------------------
|
||||
levels(dist_dataP$param_type)[[2]]
|
||||
#Lig Dist(Å), PPI Dist(Å)
|
||||
dist_data_ppi2 = dist_dataP[dist_dataP$param_type%in%c(levels(dist_dataP$param_type)[[2]]),]
|
||||
dist_data_ppi2$param_type = factor(dist_data_ppi2$param_type)
|
||||
table(dist_data_ppi2$param_type)
|
||||
levels(dist_data_ppi2$param_type)
|
||||
distanceP_ppi2 = lf_bp2(dist_data_ppi2
|
||||
#, p_title = ""
|
||||
, violin_quantiles = c(0.5), monochrome = F)
|
||||
|
||||
distanceP_ppi2
|
||||
}
|
||||
|
||||
if (tolower(gene)%in%geneL_na){
|
||||
#-------------------
|
||||
# Distance data plot: NADist
|
||||
#--------------------
|
||||
levels(dist_dataP$param_type)[[2]]
|
||||
#Lig Dist(Å), PPI Dist(Å)
|
||||
dist_data_na = dist_dataP[dist_dataP$param_type%in%c(levels(dist_dataP$param_type)[[2]]),]
|
||||
dist_data_na$param_type = factor(dist_data_na$param_type)
|
||||
table(dist_data_na$param_type)
|
||||
levels(dist_data_na$param_type)
|
||||
distanceP_na = lf_bp2(dist_data_na
|
||||
#, p_title = ""
|
||||
, violin_quantiles = c(0.5), monochrome = F)
|
||||
|
||||
distanceP_na
|
||||
}
|
||||
#==============
|
||||
# Plot:DUET
|
||||
#==============
|
||||
lf_duetP = all_dm_om_df[['lf_duet']]
|
||||
#lf_duetP = lf_duet[!lf_duet$param_type%in%c(static_colsP),]
|
||||
table(lf_duetP$param_type)
|
||||
lf_duetP$param_type = factor(lf_duetP$param_type)
|
||||
table(lf_duetP$param_type)
|
||||
|
||||
duetP = lf_bp2(lf_duetP
|
||||
#, p_title = ""
|
||||
, violin_quantiles = c(0.5), monochrome = F
|
||||
, dot_transparency = 0.2)
|
||||
|
||||
#==============
|
||||
# Plot:FoldX
|
||||
#==============
|
||||
lf_foldxP = all_dm_om_df[['lf_foldx']]
|
||||
#lf_foldxP = lf_foldx[!lf_foldx$param_type%in%c(static_colsP),]
|
||||
table(lf_foldxP$param_type)
|
||||
lf_foldxP$param_type = factor(lf_foldxP$param_type)
|
||||
table(lf_foldxP$param_type)
|
||||
|
||||
foldxP = lf_bp2(lf_foldxP
|
||||
#, p_title = ""
|
||||
, violin_quantiles = c(0.5), monochrome = F
|
||||
, dot_transparency = 0.1)
|
||||
|
||||
#==============
|
||||
# Plot:DeepDDG
|
||||
#==============
|
||||
lf_deepddgP = all_dm_om_df[['lf_deepddg']]
|
||||
#lf_deepddgP = lf_deepddg[!lf_deepddg$param_type%in%c(static_colsP),]
|
||||
table(lf_deepddgP$param_type)
|
||||
lf_deepddgP$param_type = factor(lf_deepddgP$param_type)
|
||||
table(lf_deepddgP$param_type)
|
||||
|
||||
deepddgP = lf_bp2(lf_deepddgP
|
||||
#, p_title = ""
|
||||
, violin_quantiles = c(0.5), monochrome = F
|
||||
, dot_transparency = 0.2)
|
||||
|
||||
deepddgP
|
||||
|
||||
#==============
|
||||
# Plot: Dynamut2
|
||||
#==============
|
||||
lf_dynamut2P = all_dm_om_df[['lf_dynamut2']]
|
||||
#lf_dynamut2P = lf_dynamut2[!lf_dynamut2$param_type%in%c(static_colsP),]
|
||||
table(lf_dynamut2P$param_type)
|
||||
lf_dynamut2P$param_type = factor(lf_dynamut2P$param_type)
|
||||
table(lf_dynamut2P$param_type)
|
||||
|
||||
dynamut2P = lf_bp2(lf_dynamut2P
|
||||
#, p_title = ""
|
||||
, violin_quantiles = c(0.5), monochrome = F
|
||||
, dot_transparency = 0.2)
|
||||
|
||||
|
||||
#==============
|
||||
# Plot:ConSurf
|
||||
#==============
|
||||
lf_consurfP = all_dm_om_df[['lf_consurf']]
|
||||
#lf_consurfP = lf_consurf[!lf_consurf$param_type%in%c(static_colsP),]
|
||||
table(lf_consurfP$param_type)
|
||||
lf_consurfP$param_type = factor(lf_consurfP$param_type)
|
||||
table(lf_consurfP$param_type)
|
||||
|
||||
consurfP = lf_bp2(lf_consurfP
|
||||
#, p_title = ""
|
||||
, violin_quantiles = c(0.5), monochrome = F)
|
||||
|
||||
#==============
|
||||
# Plot:PROVEAN
|
||||
#==============
|
||||
lf_proveanP = all_dm_om_df[['lf_provean']]
|
||||
#lf_proveanP = lf_provean[!lf_provean$param_type%in%c(static_colsP),]
|
||||
table(lf_proveanP$param_type)
|
||||
lf_proveanP$param_type = factor(lf_proveanP$param_type)
|
||||
table(lf_proveanP$param_type)
|
||||
|
||||
proveanP = lf_bp2(lf_proveanP
|
||||
#, p_title = ""
|
||||
, violin_quantiles = c(0.5), monochrome = F)
|
||||
|
||||
#==============
|
||||
# Plot:SNAP2
|
||||
#==============
|
||||
lf_snap2P = all_dm_om_df[['lf_snap2']]
|
||||
#lf_snap2P = lf_snap2[!lf_snap2$param_type%in%c(static_colsP),]
|
||||
table(lf_snap2P$param_type)
|
||||
lf_snap2P$param_type = factor(lf_snap2P$param_type)
|
||||
table(lf_snap2P$param_type)
|
||||
|
||||
snap2P = lf_bp2(lf_snap2P
|
||||
#, p_title = ""
|
||||
, violin_quantiles = c(0.5), monochrome = F)
|
||||
|
||||
|
||||
############################################################################
|
||||
#================
|
||||
# Plot: mCSM-lig
|
||||
#================
|
||||
lf_mcsm_ligP = all_dm_om_df[['lf_mcsm_lig']]
|
||||
#lf_mcsm_ligP = lf_mcsm_lig[!lf_mcsm_lig$param_type%in%c(static_colsP),]
|
||||
table(lf_mcsm_ligP$param_type)
|
||||
lf_mcsm_ligP$param_type = factor(lf_mcsm_ligP$param_type)
|
||||
table(lf_mcsm_ligP$param_type)
|
||||
|
||||
mcsmligP = lf_bp2(lf_mcsm_ligP
|
||||
#, p_title = ""
|
||||
, violin_quantiles = c(0.5), monochrome = F
|
||||
, dot_transparency = 1)
|
||||
|
||||
|
||||
#=================
|
||||
# Plot: mmCSM-lig2
|
||||
#=================
|
||||
lf_mmcsm_lig2P = all_dm_om_df[['lf_mmcsm_lig2']]
|
||||
#lf_mmcsm_lig2P = lf_mmcsm_lig2P[!lf_mmcsm_lig2P$param_type%in%c(static_colsP),]
|
||||
table(lf_mmcsm_lig2P$param_type)
|
||||
lf_mmcsm_lig2P$param_type = factor(lf_mmcsm_lig2P$param_type)
|
||||
table(lf_mmcsm_lig2P$param_type)
|
||||
|
||||
mcsmlig2P = lf_bp2(lf_mmcsm_lig2P
|
||||
#, p_title = ""
|
||||
, violin_quantiles = c(0.5), monochrome = F
|
||||
, dot_transparency = 1)
|
||||
|
||||
mcsmlig2P
|
||||
|
||||
#================
|
||||
# Plot: mCSM-ppi2
|
||||
#================
|
||||
if (tolower(gene)%in%geneL_ppi2){
|
||||
lf_mcsm_ppi2P = all_dm_om_df[['lf_mcsm_ppi2']]
|
||||
#lf_mcsm_ppi2P = lf_mcsm_ppi2[!lf_mcsm_ppi2$param_type%in%c(static_colsP),]
|
||||
table(lf_mcsm_ppi2P$param_type)
|
||||
lf_mcsm_ppi2P$param_type = factor(lf_mcsm_ppi2P$param_type)
|
||||
table(lf_mcsm_ppi2P$param_type)
|
||||
|
||||
mcsmppi2P = lf_bp2(lf_mcsm_ppi2P
|
||||
#, p_title = ""
|
||||
, violin_quantiles = c(0.5), monochrome = F
|
||||
, dot_transparency = 1)
|
||||
|
||||
}
|
||||
|
||||
#==============
|
||||
# Plot: mCSM-NA
|
||||
#==============
|
||||
if (tolower(gene)%in%geneL_na){
|
||||
lf_mcsm_naP = all_dm_om_df[['lf_mcsm_na']]
|
||||
#lf_mcsm_naP = lf_mcsm_na[!lf_mcsm_na$param_type%in%c(static_colsP),]
|
||||
table(lf_mcsm_naP$param_type)
|
||||
lf_mcsm_naP$param_type = factor(lf_mcsm_naP$param_type)
|
||||
table(lf_mcsm_naP$param_type)
|
||||
|
||||
mcsmnaP = lf_bp2(lf_mcsm_naP
|
||||
#, p_title = ""
|
||||
, violin_quantiles = c(0.5), monochrome = F
|
||||
, dot_transparency = 1)
|
||||
|
||||
}
|
||||
|
||||
######################################
|
||||
# Outplot with stats
|
||||
######################################
|
||||
# outdir_images = paste0("~/git/Writing/thesis/images/results/", tolower(gene), "/")
|
||||
#
|
||||
# dm_om_combinedP = paste0(outdir_images
|
||||
# ,tolower(gene)
|
||||
# ,"_dm_om_all.svg" )
|
||||
#
|
||||
# cat("DM OM plots with stats:", dm_om_combinedP)
|
||||
# svg(dm_om_combinedP, width = 32, height = 18)
|
||||
# cowplot::plot_grid(
|
||||
# cowplot::plot_grid(duetP, foldxP, deepddgP, dynamut2P, genomicsP, distanceP
|
||||
# , nrow=1
|
||||
# , rel_widths = c(1/7, 1/7,1/7,1/7, 1/7, 1.75/7)),
|
||||
# #, rel_widths = c(1/8, 1/8,1/8,1/8, 1/8, 2.75/8)), # for 3 distances
|
||||
# cowplot::plot_grid(consurfP, proveanP, snap2P
|
||||
# , mcsmligP
|
||||
# , mcsmlig2P
|
||||
# , mcsmppi2P
|
||||
# #, mcsmnaP
|
||||
# , nrow=1),
|
||||
# nrow=2)
|
||||
#
|
||||
# dev.off()
|
||||
|
||||
|
176
scripts/plotting/plotting_thesis/gid/dm_om_plots_gid_ayout.R
Normal file
176
scripts/plotting/plotting_thesis/gid/dm_om_plots_gid_ayout.R
Normal file
|
@ -0,0 +1,176 @@
|
|||
# source dm_om_plots.R
|
||||
source("/home/tanu/git/LSHTM_analysis/scripts/plotting/plotting_thesis/dm_om_plots.R")
|
||||
|
||||
##### plots to combine ####
|
||||
duetP
|
||||
foldxP
|
||||
deepddgP
|
||||
dynamut2P
|
||||
genomicsP
|
||||
consurfP
|
||||
proveanP
|
||||
snap2P
|
||||
mcsmligP
|
||||
mcsmlig2P
|
||||
mcsmnaP
|
||||
|
||||
# Plot labels
|
||||
tit1 = "Stability changes"
|
||||
tit2 = "Genomic measure"
|
||||
tit3 = "Distance to partners"
|
||||
tit4 = "Evolutionary Conservation"
|
||||
tit5 = "Affinity changes"
|
||||
pt_size = 30
|
||||
|
||||
theme_georgia <- function(...) {
|
||||
theme_gray(base_family = "sans", ...) +
|
||||
theme(plot.title = element_text(face = "bold"))
|
||||
}
|
||||
|
||||
|
||||
title_theme <- calc_element("plot.title", theme_georgia())
|
||||
|
||||
pt1 = ggdraw() +
|
||||
draw_label(
|
||||
tit1,
|
||||
fontfamily = title_theme$family,
|
||||
fontface = title_theme$face,
|
||||
#size = title_theme$size
|
||||
size = pt_size
|
||||
)
|
||||
|
||||
pt2 = ggdraw() +
|
||||
draw_label(
|
||||
tit2,
|
||||
fontfamily = title_theme$family,
|
||||
fontface = title_theme$face,
|
||||
size = pt_size
|
||||
)
|
||||
|
||||
pt3 = ggdraw() +
|
||||
draw_label(
|
||||
tit3,
|
||||
fontfamily = title_theme$family,
|
||||
fontface = title_theme$face,
|
||||
size = pt_size
|
||||
)
|
||||
|
||||
pt4 = ggdraw() +
|
||||
draw_label(
|
||||
tit4,
|
||||
fontfamily = title_theme$family,
|
||||
fontface = title_theme$face,
|
||||
size = pt_size
|
||||
)
|
||||
|
||||
|
||||
pt5 = ggdraw() +
|
||||
draw_label(
|
||||
tit5,
|
||||
fontfamily = title_theme$family,
|
||||
fontface = title_theme$face,
|
||||
size = pt_size
|
||||
)
|
||||
|
||||
#======================
|
||||
# Output plot function
|
||||
#======================
|
||||
OutPlot_dm_om = function(x){
|
||||
|
||||
# dist b/w plot title and plot
|
||||
relH_tp = c(0.08, 0.92)
|
||||
|
||||
my_label_size = 25
|
||||
#----------------
|
||||
# Top panel
|
||||
#----------------
|
||||
top_panel = cowplot::plot_grid(
|
||||
cowplot::plot_grid(pt1,
|
||||
cowplot::plot_grid(duetP, foldxP, deepddgP, dynamut2P
|
||||
, nrow = 1
|
||||
, labels = c("A", "B", "C", "D")
|
||||
, label_size = my_label_size)
|
||||
, ncol = 1
|
||||
, rel_heights = relH_tp
|
||||
),
|
||||
NULL,
|
||||
cowplot::plot_grid(pt2,
|
||||
cowplot::plot_grid(genomicsP
|
||||
, nrow = 1
|
||||
, labels = c("E")
|
||||
, label_size = my_label_size)
|
||||
, ncol = 1
|
||||
, rel_heights = relH_tp
|
||||
),
|
||||
NULL,
|
||||
cowplot::plot_grid(pt3,
|
||||
cowplot::plot_grid( #distanceP
|
||||
distanceP_lig
|
||||
, distanceP_na
|
||||
, nrow = 1
|
||||
, labels = c("F", "G")
|
||||
, label_size = my_label_size)
|
||||
, ncol = 1
|
||||
, rel_heights = relH_tp
|
||||
),
|
||||
nrow = 1,
|
||||
rel_widths = c(2/7, 0.1/7, 0.5/7, 0.1/7, 1/7)
|
||||
)
|
||||
|
||||
#----------------
|
||||
# Bottom panel
|
||||
#----------------
|
||||
bottom_panel = cowplot::plot_grid(
|
||||
cowplot::plot_grid(pt4,
|
||||
cowplot::plot_grid(consurfP, proveanP, snap2P
|
||||
, nrow = 1
|
||||
, labels = c("H", "I", "J")
|
||||
, label_size = my_label_size)
|
||||
, ncol = 1
|
||||
, rel_heights =relH_tp
|
||||
),NULL,
|
||||
cowplot::plot_grid(pt5,
|
||||
cowplot::plot_grid(mcsmligP
|
||||
, mcsmlig2P
|
||||
, mcsmnaP
|
||||
, nrow = 1
|
||||
, labels = c("K", "L", "M")
|
||||
, label_size = my_label_size)
|
||||
, ncol = 1
|
||||
, rel_heights = relH_tp
|
||||
),NULL,
|
||||
nrow = 1,
|
||||
rel_widths = c(3/6,0.1/6,3/6, 0.1/6 )
|
||||
)
|
||||
|
||||
#-------------------------------
|
||||
# combine: Top and Bottom panel
|
||||
#-------------------------------
|
||||
cowplot::plot_grid (top_panel, bottom_panel
|
||||
, nrow =2
|
||||
, rel_widths = c(1, 1)
|
||||
, align = "hv")
|
||||
}
|
||||
|
||||
#=====================
|
||||
# OutPlot: svg and png
|
||||
#======================
|
||||
dm_om_combinedP = paste0(outdir_images
|
||||
,tolower(gene)
|
||||
,"_dm_om_all.svg")
|
||||
|
||||
cat("DM OM plots with stats:", dm_om_combinedP)
|
||||
svg(dm_om_combinedP, width = 32, height = 18)
|
||||
|
||||
OutPlot_dm_om()
|
||||
dev.off()
|
||||
|
||||
|
||||
dm_om_combinedP_png = paste0(outdir_images
|
||||
,tolower(gene)
|
||||
,"_dm_om_all.png")
|
||||
cat("DM OM plots with stats:", dm_om_combinedP_png)
|
||||
png(dm_om_combinedP_png, width = 32, height = 18, units = "in", res = 300)
|
||||
|
||||
OutPlot_dm_om()
|
||||
dev.off()
|
|
@ -14,9 +14,8 @@ my_gg_pairs=function(plot_df, plot_title
|
|||
title="ρ",
|
||||
digits=2,
|
||||
justify_labels = "centre",
|
||||
#title_args=c(colour="black"),
|
||||
title_args=c(size=tt_args_size),#2.5
|
||||
group_args=c(size=gp_args_size)#2.5
|
||||
title_args=list(size=tt_args_size, colour="black"),#2.5
|
||||
group_args=list(size=gp_args_size)#2.5
|
||||
)
|
||||
),
|
||||
lower = list(
|
||||
|
@ -73,7 +72,7 @@ if (tolower(gene)%in%geneL_ppi2){
|
|||
}
|
||||
|
||||
if (tolower(gene)%in%geneL_na){
|
||||
corr_affinity_df[corr_affinity_df["NCA-Dist"]>DistCutOff,"mCSM-NA"]=0
|
||||
corr_affinity_df[corr_affinity_df["NA-Dist"]>DistCutOff,"mCSM-NA"]=0
|
||||
}
|
||||
|
||||
# count 0
|
||||
|
@ -97,6 +96,7 @@ corr_df_ps = corr_plotdf[, corr_ps_colnames]
|
|||
|
||||
# Plot #1
|
||||
plot_corr_df_ps = my_gg_pairs(corr_df_ps, plot_title="Stability estimates")
|
||||
|
||||
##########################################################
|
||||
#================
|
||||
# Conservation
|
||||
|
@ -142,37 +142,62 @@ corr_df_aff = corr_affinity_df[, corr_aff_colnames]
|
|||
colnames(corr_df_aff)
|
||||
|
||||
# Plot #3
|
||||
plot_corr_df_aff = my_gg_pairs(corr_df_aff,
|
||||
plot_title="Affinity estimates",
|
||||
tt_args_size = 4,
|
||||
gp_args_size = 4)
|
||||
plot_corr_df_aff = my_gg_pairs(corr_df_aff
|
||||
, plot_title="Affinity estimates"
|
||||
#, tt_args_size = 4
|
||||
#, gp_args_size = 4
|
||||
)
|
||||
|
||||
#=============
|
||||
# combine
|
||||
#=============
|
||||
#### Combine plots #####
|
||||
# #png("/home/tanu/tmp/gg_pairs_all.png", height = 6, width=11.75, unit="in",res=300)
|
||||
# png(paste0(outdir_images
|
||||
# ,tolower(gene)
|
||||
# ,"_CorrAB.png"), height = 6, width=11.75, unit="in",res=300)
|
||||
#
|
||||
# cowplot::plot_grid(ggmatrix_gtable(plot_corr_df_ps),
|
||||
# ggmatrix_gtable(plot_corr_df_cons),
|
||||
# # ggmatrix_gtable(plot_corr_df_aff),
|
||||
# # nrow=1, ncol=3, rel_heights = 7,7,3
|
||||
# nrow=1,
|
||||
# #rel_heights = 1,1
|
||||
# labels = "AUTO",
|
||||
# label_size = 12)
|
||||
# dev.off()
|
||||
#
|
||||
# # affinity corr
|
||||
# #png("/home/tanu/tmp/gg_pairs_affinity.png", height =7, width=7, unit="in",res=300)
|
||||
# png(paste0(outdir_images
|
||||
# ,tolower(gene)
|
||||
# ,"_CorrC.png"), height =7, width=7, unit="in",res=300)
|
||||
#
|
||||
# cowplot::plot_grid(ggmatrix_gtable(plot_corr_df_aff),
|
||||
# labels = "C",
|
||||
# label_size = 12)
|
||||
# dev.off()
|
||||
|
||||
#png("/home/tanu/tmp/gg_pairs_all.png", height = 6, width=11.75, unit="in",res=300)
|
||||
#### Combine A ####
|
||||
png(paste0(outdir_images
|
||||
,tolower(gene)
|
||||
,"_CorrAB.png"), height = 7, width=11.75, unit="in",res=300)
|
||||
,"_CorrA.png"), height =8, width=8, unit="in",res=300)
|
||||
|
||||
cowplot::plot_grid(ggmatrix_gtable(plot_corr_df_ps),
|
||||
ggmatrix_gtable(plot_corr_df_cons),
|
||||
labels = "A",
|
||||
label_size = 12)
|
||||
dev.off()
|
||||
|
||||
#### Combine B+C ####
|
||||
# B + C
|
||||
png(paste0(outdir_images
|
||||
,tolower(gene)
|
||||
,"_CorrBC.png"), height = 6, width=11.75, unit="in",res=300)
|
||||
|
||||
cowplot::plot_grid(ggmatrix_gtable(plot_corr_df_cons),
|
||||
ggmatrix_gtable(plot_corr_df_aff),
|
||||
# ggmatrix_gtable(plot_corr_df_aff),
|
||||
# nrow=1, ncol=3, rel_heights = 7,7,3
|
||||
nrow=1,
|
||||
rel_widths = c(1.5,1),
|
||||
labels = "AUTO",
|
||||
#rel_heights = 1,1
|
||||
labels = c("B", "C"),
|
||||
label_size = 12)
|
||||
dev.off()
|
||||
|
||||
# affinity corr
|
||||
#png("/home/tanu/tmp/gg_pairs_affinity.png", height =7, width=7, unit="in",res=300)
|
||||
png(paste0(outdir_images
|
||||
,tolower(gene)
|
||||
,"_CorrC.png"), height =7, width=7, unit="in",res=300)
|
||||
|
||||
cowplot::plot_grid(ggmatrix_gtable(plot_corr_df_aff),
|
||||
labels = "C",
|
||||
label_size = 12)
|
||||
dev.off()
|
||||
|
|
2
scripts/plotting/plotting_thesis/gid/gid_other_plots.R
Normal file
2
scripts/plotting/plotting_thesis/gid/gid_other_plots.R
Normal file
|
@ -0,0 +1,2 @@
|
|||
|
||||
source("/home/tanu/git/LSHTM_analysis/scripts/plotting/plotting_thesis/linage_bp_dist_layout.R")
|
173
scripts/plotting/plotting_thesis/gid/pe_sens_site_count_gid.R
Normal file
173
scripts/plotting/plotting_thesis/gid/pe_sens_site_count_gid.R
Normal file
|
@ -0,0 +1,173 @@
|
|||
source("/home/tanu/git/LSHTM_analysis/scripts/plotting/plotting_thesis/gid/prominent_effects_gid.R")
|
||||
source("/home/tanu/git/LSHTM_analysis/scripts/plotting/plotting_thesis/gid/sensitivity_count_gid.R")
|
||||
|
||||
##############################################################
|
||||
# PE count
|
||||
#lig-- na--ppi2--stab
|
||||
# pe_colour_map = c("DD_lig" = "#ffd700" # gold
|
||||
# , "SS_lig" = "#f0e68c" # khaki
|
||||
#
|
||||
# , "DD_nucleic_acid"= "#a0522d" # sienna
|
||||
# , "SS_nucleic_acid"= "#d2b48c" # tan
|
||||
#
|
||||
# , "DD_ppi2" = "#da70d6" # orchid
|
||||
# , "SS_ppi2" = "#ff1493" # deeppink
|
||||
#
|
||||
# , "DD_stability" = "#f8766d" # red
|
||||
# , "SS_stability" = "#00BFC4") # blue
|
||||
table(str_df_plot_cols$pe_effect_outcome)
|
||||
##############################################################
|
||||
#===========
|
||||
#PE count
|
||||
#===========
|
||||
rects <- data.frame(x=1:6,
|
||||
colors = c("#ffd700" ,
|
||||
"#f0e68c" ,
|
||||
|
||||
"#a0522d" ,
|
||||
"#d2b48c" ,
|
||||
|
||||
"#f8766d" ,
|
||||
"#00BFC4")
|
||||
)
|
||||
|
||||
rects$text = c("-ve Lig"
|
||||
, "+ve Lig"
|
||||
|
||||
, "-ve\nNuc.Acid"
|
||||
, "+ve\nNuc.Acid"
|
||||
|
||||
, "-ve stability"
|
||||
, "+ve stability"
|
||||
)
|
||||
|
||||
cell1 = table(str_df_plot_cols$pe_effect_outcome)[["DD_lig"]]
|
||||
cell2 = 0
|
||||
|
||||
cell3 = table(str_df_plot_cols$pe_effect_outcome)[["DD_nucleic_acid"]]
|
||||
cell4 = table(str_df_plot_cols$pe_effect_outcome)[["SS_nucleic_acid"]]
|
||||
|
||||
#cell5 = table(str_df_plot_cols$pe_effect_outcome)[["DD_ppi2"]]
|
||||
#cell6 = table(str_df_plot_cols$pe_effect_outcome)[["SS_ppi2"]]
|
||||
|
||||
cell7 = table(str_df_plot_cols$pe_effect_outcome)[["DD_stability"]]
|
||||
cell8 = table(str_df_plot_cols$pe_effect_outcome)[["SS_stability"]]
|
||||
|
||||
|
||||
#rects$numbers = c(38, 0, 22, 9, 108, 681) #for embb
|
||||
rects$numbers = c(cell1, cell2,
|
||||
cell3, cell4,
|
||||
# cell5, cell6,
|
||||
cell7, cell8)
|
||||
|
||||
rects$num_labels = paste0("n=", rects$numbers)
|
||||
|
||||
rects
|
||||
#------
|
||||
# Plot
|
||||
#------
|
||||
#https://stackoverflow.com/questions/47986055/create-a-rectangle-filled-with-text
|
||||
peP = ggplot(rects, aes(x, y = 0, fill = colors, label = paste0(text,"\n", num_labels))) +
|
||||
geom_tile(width = 1, height = 1) + # make square tiles
|
||||
geom_text(color = "black", size = 1.7) + # add white text in the middle
|
||||
scale_fill_identity(guide = "none") + # color the tiles with the colors in the data frame
|
||||
coord_fixed() + # make sure tiles are square
|
||||
coord_flip()+ scale_x_reverse() +
|
||||
# theme_void() # remove any axis markings
|
||||
theme_nothing() # remove any axis markings
|
||||
peP
|
||||
|
||||
#------
|
||||
# Plot: this one is better
|
||||
#------
|
||||
peP2 = ggplot(rects, aes(x, y = 0, fill = colors, label = paste0(text,"\n", num_labels))) +
|
||||
geom_tile() + # make square tiles
|
||||
geom_text(color = "black", size = 1.6) + # add white text in the middle
|
||||
scale_fill_identity(guide = "none") + # color the tiles with the colors in the data frame
|
||||
coord_fixed() + # make sure tiles are square
|
||||
theme_nothing() # remove any axis markings
|
||||
peP2
|
||||
|
||||
########################################################
|
||||
# From: script sensitivity_count per gene
|
||||
#===============================
|
||||
# Sensitivity count: SITE
|
||||
#===============================
|
||||
#--------
|
||||
# embb
|
||||
#--------
|
||||
#rsc = 54
|
||||
#ccc = 46
|
||||
#ssc = 470
|
||||
|
||||
rsc = site_Rc; rsc
|
||||
ccc = site_Cc; ccc
|
||||
ssc = site_Sc; ssc
|
||||
|
||||
rect_rs_siteC <- data.frame(x=1:3,
|
||||
colors = c("red",
|
||||
"purple",
|
||||
"blue")
|
||||
)
|
||||
|
||||
rect_rs_siteC
|
||||
rect_rs_siteC$text = c("Resistant",
|
||||
"Common",
|
||||
"Sensitive")
|
||||
|
||||
rect_rs_siteC$numbers = c(rsc,ccc,ssc)
|
||||
rect_rs_siteC$num_labels = paste0("n=", rect_rs_siteC$numbers)
|
||||
rect_rs_siteC
|
||||
|
||||
#------
|
||||
# Plot
|
||||
#------
|
||||
sens_siteP = ggplot(rect_rs_siteC, aes(x, y = 0,
|
||||
fill = colors,
|
||||
label = num_labels
|
||||
#,label = paste0(text,"\n", num_labels)
|
||||
)) +
|
||||
geom_tile(width = 1, height = 1) +
|
||||
#geom_text(color = "black", size = 1.7) +
|
||||
geom_label(color = "black", size = 1.7,fill = "white", alpha=0.7) +
|
||||
scale_fill_identity(guide = "none") +
|
||||
coord_fixed()+
|
||||
theme_nothing() # remove any axis markings
|
||||
sens_siteP
|
||||
|
||||
################################################################
|
||||
#===============================
|
||||
# Sensitivity count: Mutations
|
||||
#===============================
|
||||
table(sensP_df$sensitivity)
|
||||
muts_Rc = table(sensP_df$sensitivity)[["R"]]
|
||||
muts_Sc = table(sensP_df$sensitivity)[["S"]]
|
||||
rect_sens <- data.frame(x=1:2,
|
||||
colors = c("red",
|
||||
"blue")
|
||||
)
|
||||
|
||||
rect_sens$text = c("Resistant",
|
||||
"Sensitive")
|
||||
rect_sens$numbers = c(muts_Rc,muts_Sc)
|
||||
rect_sens$num_labels = paste0("n=", rect_sens$numbers)
|
||||
rect_sens
|
||||
#------
|
||||
# Plot
|
||||
#------
|
||||
sensP = ggplot(rect_sens, aes(x, y = 0,
|
||||
fill = colors,
|
||||
label = paste0(text,"\n", num_labels))) +
|
||||
geom_tile(width = 1, height = 1) +
|
||||
#geom_text(color = "black", size = 1.7) +
|
||||
geom_label(color = "black", size = 1.7,fill = "white", alpha=0.7) +
|
||||
scale_fill_identity(guide = "none") +
|
||||
coord_fixed()+
|
||||
theme_nothing() # remove any axis markings
|
||||
sensP
|
||||
|
||||
sensP2 = sensP +
|
||||
coord_flip() + scale_x_reverse()
|
||||
sensP2
|
||||
|
||||
|
341
scripts/plotting/plotting_thesis/gid/prominent_effects_gid.R
Normal file
341
scripts/plotting/plotting_thesis/gid/prominent_effects_gid.R
Normal file
|
@ -0,0 +1,341 @@
|
|||
#!/usr/bin/env Rscript
|
||||
#source("~/git/LSHTM_analysis/config/gid.R")
|
||||
# get plotting dfs
|
||||
#source("~/git/LSHTM_analysis/scripts/plotting/get_plotting_dfs.R")
|
||||
########################################################
|
||||
pos_colname = "position"
|
||||
|
||||
#-------------
|
||||
# from ~/git/LSHTM_analysis/scripts/plotting/plotting_colnames.R
|
||||
#-------------
|
||||
length(all_stability_cols); length(raw_stability_cols)
|
||||
length(scaled_stability_cols); length(outcome_stability_cols)
|
||||
length(affinity_dist_colnames)
|
||||
|
||||
|
||||
static_cols = c("mutationinformation",
|
||||
#"position",
|
||||
pos_colname,
|
||||
"sensitivity")
|
||||
|
||||
other_cols_all = c(scaled_stability_cols, scaled_affinity_cols, affinity_dist_colnames)
|
||||
|
||||
#omit avg cols and foldx_scaled_signC cols
|
||||
other_cols = other_cols_all[grep("avg", other_cols_all, invert = T)]
|
||||
other_cols = other_cols[grep("foldx_scaled_signC",other_cols, invert = T )]
|
||||
other_cols
|
||||
|
||||
cols_to_extract = c(static_cols, other_cols)
|
||||
cat("\nExtracting cols:", cols_to_extract)
|
||||
expected_ncols = length(static_cols) + length(other_cols)
|
||||
expected_ncols
|
||||
|
||||
str_df = merged_df3[, cols_to_extract]
|
||||
|
||||
if (ncol(str_df) == expected_ncols){
|
||||
cat("\nPASS: successfully extracted cols for calculating prominent effects")
|
||||
}else{
|
||||
stop("\nAbort: Could not extract cols for calculating prominent effects")
|
||||
}
|
||||
|
||||
#=========================
|
||||
# Masking affinity columns
|
||||
#=========================
|
||||
# First make values for affinity cols 0 when their corresponding dist >10
|
||||
head(str_df)
|
||||
|
||||
# replace in place affinity values >10
|
||||
str_df[str_df["ligand_distance"]>10,"affinity_scaled"]=0
|
||||
str_df[str_df["ligand_distance"]>10,"mmcsm_lig_scaled"]=0
|
||||
|
||||
#ppi2 gene: replace in place ppi2 affinity values where ppi2 dist >10
|
||||
if (tolower(gene)%in%geneL_ppi2){
|
||||
str_df[str_df["interface_dist"]>10,"mcsm_ppi2_scaled"]=0
|
||||
}
|
||||
|
||||
# na gene: replace in place na affinity values where na dist >10
|
||||
if (tolower(gene)%in%geneL_na){
|
||||
str_df[str_df["nca_distance"]>10,"mcsm_na_scaled"]=0
|
||||
}
|
||||
|
||||
colnames(str_df)
|
||||
head(str_df)
|
||||
|
||||
# get names of cols to calculate the prominent effects from
|
||||
# scaled_cols_tc = c("duet_scaled",
|
||||
# "deepddg_scaled",
|
||||
# "ddg_dynamut2_scaled",
|
||||
# "foldx_scaled",
|
||||
# "affinity_scaled",
|
||||
# "mmcsm_lig_scaled",
|
||||
# "mcsm_ppi2_scaled", "mcsm_na_scaled")
|
||||
|
||||
scaled_cols_tc = other_cols[grep("scaled", other_cols)]
|
||||
###############################################
|
||||
|
||||
|
||||
#===============
|
||||
# whole df
|
||||
#===============
|
||||
give_col=function(x,y,df=str_df){
|
||||
df[df[[pos_colname]]==x,y]
|
||||
}
|
||||
|
||||
for (i in unique(str_df[[pos_colname]]) ){
|
||||
print(i)
|
||||
#cat(length(unique(str_df[[pos_colname]])))
|
||||
|
||||
biggest = max(abs(give_col(i,scaled_cols_tc)))
|
||||
|
||||
str_df[str_df[[pos_colname]]==i,'abs_max_effect'] = biggest
|
||||
str_df[str_df[[pos_colname]]==i,'effect_type']= names(
|
||||
give_col(i,scaled_cols_tc)[which(
|
||||
abs(
|
||||
give_col(i,scaled_cols_tc)
|
||||
) == biggest, arr.ind=T
|
||||
)[, "col"]])[1]
|
||||
|
||||
effect_name = unique(str_df[str_df[[pos_colname]]==i,'effect_type'])#[1] # pick first one in case we have multiple exact values
|
||||
|
||||
# get index/rowname for value of max effect, and then use it to get the original sign
|
||||
# here
|
||||
#ind = rownames(which(abs(str_df[str_df[[pos_colname]]==i,c('position',effect_name)][effect_name])== biggest, arr.ind=T))
|
||||
ind = rownames(which(abs(str_df[str_df[[pos_colname]]==i,c(pos_colname,effect_name)][effect_name])== biggest, arr.ind=T))
|
||||
|
||||
str_df[str_df[[pos_colname]]==i,'effect_sign'] = sign(str_df[effect_name][ind,])[1]
|
||||
}
|
||||
|
||||
# ends with suffix 2 if dups
|
||||
str_df$effect_type = sub("\\.[0-9]+", "", str_df$effect_type) # cull duplicate effect types that happen when there are exact duplicate values
|
||||
colnames(str_df)
|
||||
table(str_df$effect_type)
|
||||
|
||||
# check
|
||||
str_df_check = str_df[str_df[[pos_colname]]%in%c(24, 32, 160, 303, 334),]
|
||||
|
||||
#================
|
||||
# for Plots
|
||||
#================
|
||||
str_df_short = str_df[, c("mutationinformation",
|
||||
#"position",
|
||||
pos_colname,
|
||||
"sensitivity"
|
||||
, "effect_type"
|
||||
, "effect_sign")]
|
||||
|
||||
table(str_df_short$effect_type)
|
||||
table(str_df_short$effect_sign)
|
||||
str(str_df_short)
|
||||
|
||||
# assign pe outcome
|
||||
str_df_short$pe_outcome = ifelse(str_df_short$effect_sign<0, "DD", "SS")
|
||||
table(str_df_short$pe_outcome )
|
||||
table(str_df_short$effect_sign)
|
||||
|
||||
#==============
|
||||
# group effect type:
|
||||
# lig, ppi2, nuc. acid, stability
|
||||
#==============
|
||||
affcols = c("affinity_scaled", "mmcsm_lig_scaled")
|
||||
nuc_na_cols = c("mcsm_na_scaled")
|
||||
|
||||
#lig
|
||||
table(str_df_short$effect_type)
|
||||
str_df_short$effect_grouped = ifelse(str_df_short$effect_type%in%affcols
|
||||
, "lig"
|
||||
, str_df_short$effect_type)
|
||||
table(str_df_short$effect_grouped)
|
||||
|
||||
|
||||
#na
|
||||
str_df_short$effect_grouped = ifelse(str_df_short$effect_grouped%in%nuc_na_cols
|
||||
, "nucleic_acid"
|
||||
, str_df_short$effect_grouped)
|
||||
table(str_df_short$effect_grouped)
|
||||
|
||||
#stability
|
||||
str_df_short$effect_grouped = ifelse(!str_df_short$effect_grouped%in%c("lig",
|
||||
"nucleic_acid")
|
||||
, "stability"
|
||||
, str_df_short$effect_grouped)
|
||||
|
||||
table(str_df_short$effect_grouped)
|
||||
|
||||
# create a sign as well
|
||||
str_df_short$pe_effect_outcome = paste0(str_df_short$pe_outcome, "_"
|
||||
, str_df_short$effect_grouped)
|
||||
|
||||
table(str_df_short$pe_effect_outcome)
|
||||
|
||||
#####################################################################
|
||||
# Chimera: for colouring
|
||||
####################################################################
|
||||
|
||||
#-------------------------------------
|
||||
# get df with unique position
|
||||
#--------------------------------------
|
||||
#data[!duplicated(data$x), ]
|
||||
str_df_plot = str_df_short[!duplicated(str_df[[pos_colname]]),]
|
||||
|
||||
if (nrow(str_df_plot) == length(unique(str_df[[pos_colname]]))){
|
||||
cat("\nPASS: successfully extracted df with unique positions")
|
||||
}else{
|
||||
stop("\nAbort: Could not extract df with unique positions")
|
||||
}
|
||||
|
||||
#-------------------------------------
|
||||
# generate colours for effect types
|
||||
#--------------------------------------
|
||||
str_df_plot_cols = str_df_plot[, c(pos_colname,
|
||||
"sensitivity",
|
||||
"pe_outcome",
|
||||
"effect_grouped",
|
||||
"pe_effect_outcome")]
|
||||
head(str_df_plot_cols)
|
||||
|
||||
# colour intensity based on sign
|
||||
#str_df_plot_cols$colour_hue = ifelse(str_df_plot_cols$effect_sign<0, "bright", "light")
|
||||
str_df_plot_cols$colour_hue = ifelse(str_df_plot_cols$pe_outcome=="DD", "bright", "light")
|
||||
|
||||
table(str_df_plot_cols$colour_hue); table(str_df_plot$pe_outcome)
|
||||
head(str_df_plot_cols)
|
||||
|
||||
# colour based on effect
|
||||
table(str_df_plot_cols$pe_effect_outcome)
|
||||
|
||||
# colors = c("#ffd700" #gold
|
||||
# , "#f0e68c" #khaki
|
||||
# , "#da70d6"# orchid
|
||||
# , "#ff1493"# deeppink
|
||||
# , "#a0522d" #sienna
|
||||
# , "#d2b48c" # tan
|
||||
# , "#00BFC4" #, "#007d85" #blue
|
||||
# , "#F8766D" )# red
|
||||
|
||||
pe_colour_map = c("DD_lig" = "#ffd700" # gold
|
||||
, "SS_lig" = "#f0e68c" # khaki
|
||||
|
||||
, "DD_nucleic_acid"= "#a0522d" # sienna
|
||||
, "SS_nucleic_acid"= "#d2b48c" # tan
|
||||
|
||||
, "DD_ppi2" = "#da70d6" # orchid
|
||||
, "SS_ppi2" = "#ff1493" # deeppink
|
||||
|
||||
, "DD_stability" = "#f8766d" # red
|
||||
, "SS_stability" = "#00BFC4") # blue
|
||||
|
||||
#unlist(d[c('a', 'a', 'c', 'b')], use.names=FALSE)
|
||||
|
||||
#map the colours
|
||||
str_df_plot_cols$colour_map= unlist(map(str_df_plot_cols$pe_effect_outcome
|
||||
,function(x){pe_colour_map[[x]]}
|
||||
))
|
||||
head(str_df_plot_cols$colour_map)
|
||||
table(str_df_plot_cols$colour_map)
|
||||
table(str_df_plot_cols$pe_effect_outcome)
|
||||
|
||||
# str_df_plot_cols$colours = paste0(str_df_plot_cols$colour_hue
|
||||
# , "_"
|
||||
# , str_df_plot_cols$colour_map)
|
||||
# head(str_df_plot_cols$colours)
|
||||
# table(str_df_plot_cols$colours)
|
||||
#
|
||||
#
|
||||
# class(str_df_plot_cols$colour_map)
|
||||
# str(str_df_plot_cols)
|
||||
|
||||
# sort by colour
|
||||
head(str_df_plot_cols)
|
||||
str_df_plot_cols = str_df_plot_cols[order(str_df_plot_cols$colour_map), ]
|
||||
head(str_df_plot_cols)
|
||||
|
||||
#======================================
|
||||
# write file with prominent effects
|
||||
#======================================
|
||||
outdir_images = paste0("~/git/Writing/thesis/images/results/", tolower(gene), "/")
|
||||
write.csv(str_df_plot_cols, paste0(outdir_images, tolower(gene), "_prominent_effects.csv"))
|
||||
|
||||
################################
|
||||
# printing for chimera
|
||||
###############################
|
||||
chain_suffix = ".A"
|
||||
str_df_plot_cols$pos_chain = paste0(str_df_plot_cols[[pos_colname]], chain_suffix)
|
||||
table(str_df_plot_cols$colour_map)
|
||||
table(str_df_plot_cols$pe_effect_outcome)
|
||||
|
||||
#===================================================
|
||||
#-------------------
|
||||
# Ligand Affinity
|
||||
#-------------------
|
||||
# -ve Lig Aff
|
||||
dd_lig = str_df_plot_cols[str_df_plot_cols$pe_effect_outcome=="DD_lig",]
|
||||
if (nrow(dd_lig) == table(str_df_plot_cols$pe_effect_outcome)[['DD_lig']]){
|
||||
dd_lig_pos = dd_lig[[pos_colname]]
|
||||
}else{
|
||||
stop("Abort: DD affinity colour numbers mismtatch")
|
||||
}
|
||||
|
||||
# +ve Lig Aff
|
||||
ss_lig = str_df_plot_cols[str_df_plot_cols$pe_effect_outcome=="SS_lig",]
|
||||
if (!empty(ss_lig)){
|
||||
if (nrow(ss_lig) == table(str_df_plot_cols$pe_effect_outcome)[['SS_lig']]){
|
||||
ss_lig_pos = ss_lig[[pos_colname]]
|
||||
}else{
|
||||
stop("Abort: SS affinity colour numbers mismtatch")
|
||||
}
|
||||
#put in chimera cmd
|
||||
paste0(dd_lig_pos,chain_suffix)
|
||||
paste0(ss_lig_pos,chain_suffix)
|
||||
|
||||
}
|
||||
|
||||
#===================================================
|
||||
#------------------------
|
||||
# Nucleic Acid Affinity
|
||||
#------------------------
|
||||
# -ve NA aff
|
||||
dd_nca = str_df_plot_cols[str_df_plot_cols$pe_effect_outcome=="DD_nucleic_acid",]
|
||||
if (nrow(dd_nca) == table(str_df_plot_cols$pe_effect_outcome)[['DD_nucleic_acid']]){
|
||||
dd_nca_pos = dd_nca[[pos_colname]]
|
||||
}else{
|
||||
stop("Abort: DD nucleic_acid colour numbers mismtatch")
|
||||
}
|
||||
|
||||
# +ve NA aff
|
||||
ss_nca = str_df_plot_cols[str_df_plot_cols$pe_effect_outcome=="SS_nucleic_acid",]
|
||||
if (nrow(ss_nca) == table(str_df_plot_cols$pe_effect_outcome)[['SS_nucleic_acid']]){
|
||||
ss_nca_pos = ss_nca[[pos_colname]]
|
||||
}else{
|
||||
stop("Abort: SS nucleic_acid colour numbers mismtatch")
|
||||
}
|
||||
|
||||
#put in chimera cmd
|
||||
paste0(dd_nca_pos, chain_suffix)
|
||||
paste0(ss_nca_pos, chain_suffix)
|
||||
|
||||
#=========================================================
|
||||
#------------------------
|
||||
# Stability
|
||||
#------------------------
|
||||
# -ve Stability
|
||||
dd_stability = str_df_plot_cols[str_df_plot_cols$pe_effect_outcome=="DD_stability",]
|
||||
if (nrow(dd_stability) == table(str_df_plot_cols$pe_effect_outcome)[['DD_stability']]){
|
||||
dd_stability_pos = dd_stability[[pos_colname]]
|
||||
}else{
|
||||
stop("Abort: DD Stability colour numbers mismtatch")
|
||||
}
|
||||
|
||||
# +ve Stability
|
||||
ss_stability = str_df_plot_cols[str_df_plot_cols$pe_effect_outcome=="SS_stability",]
|
||||
if (nrow(ss_stability) == table(str_df_plot_cols$pe_effect_outcome)[['SS_stability']]){
|
||||
ss_stability_pos = ss_stability[[pos_colname]]
|
||||
}else{
|
||||
stop("Abort: SS Stability colour numbers mismtatch")
|
||||
}
|
||||
|
||||
#put in chimera cmd
|
||||
# stabiliting first as it has less numbers
|
||||
paste0(ss_stability_pos, chain_suffix)
|
||||
paste0(dd_stability_pos, chain_suffix)
|
||||
####################################################################
|
||||
|
65
scripts/plotting/plotting_thesis/gid/sensitivity_count_gid.R
Normal file
65
scripts/plotting/plotting_thesis/gid/sensitivity_count_gid.R
Normal file
|
@ -0,0 +1,65 @@
|
|||
#=========================
|
||||
# Count Sensitivity
|
||||
# Mutations and positions
|
||||
#=========================
|
||||
pos_colname_c ="position"
|
||||
|
||||
sensP_df = merged_df3[,c("mutationinformation",
|
||||
#"position",
|
||||
pos_colname_c,
|
||||
"sensitivity")]
|
||||
|
||||
head(sensP_df)
|
||||
table(sensP_df$sensitivity)
|
||||
|
||||
#---------------
|
||||
# Total unique positions
|
||||
#----------------
|
||||
tot_mut_pos = length(unique(sensP_df[[pos_colname_c]]))
|
||||
cat("\nNo of Tot muts sites:", tot_mut_pos)
|
||||
|
||||
# resistant mut pos
|
||||
sens_site_allR = sensP_df[[pos_colname_c]][sensP_df$sensitivity=="R"]
|
||||
sens_site_UR = unique(sens_site_allR)
|
||||
length(sens_site_UR)
|
||||
|
||||
# Sensitive mut pos
|
||||
sens_site_allS = sensP_df[[pos_colname_c]][sensP_df$sensitivity=="S"]
|
||||
sens_site_US = unique(sens_site_allS)
|
||||
length(sens_site_UR)
|
||||
|
||||
#---------------
|
||||
# Common Sites
|
||||
#----------------
|
||||
common_pos = intersect(sens_site_UR,sens_site_US)
|
||||
site_Cc = length(common_pos)
|
||||
cat("\nNo of Common sites:", site_Cc
|
||||
, "\nThese are:", common_pos)
|
||||
|
||||
#---------------
|
||||
# Resistant muts
|
||||
#----------------
|
||||
site_R = sens_site_UR[!sens_site_UR%in%common_pos]
|
||||
site_Rc = length(site_R)
|
||||
|
||||
if ( length(sens_site_allR) == table(sensP_df$sensitivity)[['R']] ){
|
||||
cat("\nNo of R muts:", length(sens_site_allR)
|
||||
, "\nNo. of R sites:",site_Rc
|
||||
, "\nThese are:", site_R
|
||||
)
|
||||
}
|
||||
|
||||
#---------------
|
||||
# Sensitive muts
|
||||
#----------------
|
||||
site_S = sens_site_US[!sens_site_US%in%common_pos]
|
||||
site_Sc = length(site_S)
|
||||
|
||||
if ( length(sens_site_allS) == table(sensP_df$sensitivity)[['S']] ){
|
||||
cat("\nNo of S muts:", length(sens_site_allS)
|
||||
, "\nNo. of S sites:", site_Sc
|
||||
, "\nThese are:", site_S)
|
||||
}
|
||||
|
||||
#########################
|
||||
|
Loading…
Add table
Add a link
Reference in a new issue