added cmd option for dynamut2 formatting results
This commit is contained in:
parent
c5c4d74acf
commit
a67a07db2d
7 changed files with 65 additions and 16 deletions
0
dynamut/format_results_dynamut.py
Normal file → Executable file
0
dynamut/format_results_dynamut.py
Normal file → Executable file
0
dynamut/format_results_dynamut2.py
Normal file → Executable file
0
dynamut/format_results_dynamut2.py
Normal file → Executable file
47
dynamut/run_format_results_dynamut.py
Normal file → Executable file
47
dynamut/run_format_results_dynamut.py
Normal file → Executable file
|
@ -20,8 +20,45 @@ from format_results_dynamut2 import *
|
||||||
# variables
|
# variables
|
||||||
# TODO: add cmd line args
|
# TODO: add cmd line args
|
||||||
|
|
||||||
gene = 'gid'
|
#gene =
|
||||||
drug = 'streptomycin'
|
#drug =
|
||||||
|
|
||||||
|
#%% command line args
|
||||||
|
arg_parser = argparse.ArgumentParser()
|
||||||
|
arg_parser.add_argument('-d', '--drug', help='drug name (case sensitive)', default = None)
|
||||||
|
arg_parser.add_argument('-g', '--gene', help='gene name (case sensitive)', default = None)
|
||||||
|
arg_parser.add_argument('--datadir', help = 'Data Directory. By default, it assmumes homedir + git/Data')
|
||||||
|
arg_parser.add_argument('-i', '--input_dir', help = 'Input dir containing pdb files. By default, it assmumes homedir + <drug> + input')
|
||||||
|
arg_parser.add_argument('-o', '--output_dir', help = 'Output dir for results. By default, it assmes homedir + <drug> + output')
|
||||||
|
#arg_parser.add_argument('-m', '--make_dirs', help = 'Make dir for input and output', action='store_true') # should be handled elsewhere!
|
||||||
|
|
||||||
|
arg_parser.add_argument('--debug', action ='store_true', help = 'Debug Mode')
|
||||||
|
|
||||||
|
args = arg_parser.parse_args()
|
||||||
|
#=======================================================================
|
||||||
|
#%% variable assignment: input and output paths & filenames
|
||||||
|
drug = args.drug
|
||||||
|
gene = args.gene
|
||||||
|
datadir = args.datadir
|
||||||
|
indir = args.input_dir
|
||||||
|
outdir = args.output_dir
|
||||||
|
#make_dirs = args.make_dirs
|
||||||
|
|
||||||
|
#%% input and output dirs and files
|
||||||
|
#=======
|
||||||
|
# dirs
|
||||||
|
#=======
|
||||||
|
if not datadir:
|
||||||
|
datadir = homedir + '/' + 'git/Data'
|
||||||
|
|
||||||
|
if not indir:
|
||||||
|
indir = datadir + '/' + drug + '/input'
|
||||||
|
|
||||||
|
if not outdir:
|
||||||
|
outdir = datadir + '/' + drug + '/output'
|
||||||
|
|
||||||
|
#%%=====================================================================
|
||||||
|
|
||||||
datadir = homedir + '/git/Data'
|
datadir = homedir + '/git/Data'
|
||||||
indir = datadir + '/' + drug + '/input'
|
indir = datadir + '/' + drug + '/input'
|
||||||
outdir = datadir + '/' + drug + '/output'
|
outdir = datadir + '/' + drug + '/output'
|
||||||
|
@ -29,12 +66,12 @@ outdir_dynamut = outdir + '/dynamut_results/'
|
||||||
outdir_dynamut2 = outdir + '/dynamut_results/dynamut2/'
|
outdir_dynamut2 = outdir + '/dynamut_results/dynamut2/'
|
||||||
|
|
||||||
# Input file
|
# Input file
|
||||||
infile_dynamut = outdir_dynamut + gene + '_dynamut_all_output_clean.csv'
|
#infile_dynamut = outdir_dynamut + gene + '_dynamut_all_output_clean.csv'
|
||||||
infile_dynamut2 = outdir_dynamut2 + gene + '_dynamut2_output_combined_clean.csv'
|
infile_dynamut2 = outdir_dynamut2 + gene + '_dynamut2_output_combined_clean.csv'
|
||||||
|
|
||||||
# Formatted output filename
|
# Formatted output filename
|
||||||
outfile_dynamut_f = outdir_dynamut2 + gene + '_complex_dynamut_norm.csv'
|
#outfile_dynamut_f = outdir_dynamut2 + gene + '_dynamut_norm.csv'
|
||||||
outfile_dynamut2_f = outdir_dynamut2 + gene + '_complex_dynamut2_norm.csv'
|
outfile_dynamut2_f = outdir_dynamut2 + gene + '_dynamut2_norm.csv'
|
||||||
|
|
||||||
#===============================
|
#===============================
|
||||||
# CALL: format_results_dynamut
|
# CALL: format_results_dynamut
|
||||||
|
|
|
@ -17,8 +17,8 @@ my_host = 'http://biosig.unimelb.edu.au'
|
||||||
#headers = {"User-Agent":"Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_4) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/83.0.4103.97 Safari/537.36"}
|
#headers = {"User-Agent":"Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_4) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/83.0.4103.97 Safari/537.36"}
|
||||||
|
|
||||||
# TODO: add cmd line args
|
# TODO: add cmd line args
|
||||||
#gene = 'gid'
|
# gene =
|
||||||
drug = 'streptomycin'
|
# drug =
|
||||||
datadir = homedir + '/git/Data/'
|
datadir = homedir + '/git/Data/'
|
||||||
indir = datadir + drug + '/input/'
|
indir = datadir + drug + '/input/'
|
||||||
outdir = datadir + drug + '/output/'
|
outdir = datadir + drug + '/output/'
|
||||||
|
|
|
@ -13,10 +13,25 @@ CHUNK=$3
|
||||||
mkdir -p ${OUTDIR}/${CHUNK}/chain_added
|
mkdir -p ${OUTDIR}/${CHUNK}/chain_added
|
||||||
cd ${OUTDIR}/${CHUNK}/chain_added
|
cd ${OUTDIR}/${CHUNK}/chain_added
|
||||||
|
|
||||||
# makes the 2 dirs, hence ../..
|
# makes the 3 dirs, hence ../..
|
||||||
split ../../../${INFILE} -l ${CHUNK} -d snp_batch_
|
split ../../../${INFILE} -l ${CHUNK} -d snp_batch_
|
||||||
|
|
||||||
# use case
|
########################################################################
|
||||||
#~/git/LSHTM_analysis/dynamut/split_csv_chain.sh katg_mcsm_formatted_snps.csv snp_batches 50 #Date: 20/09/2021
|
# use cases
|
||||||
|
# Date: 20/09/2021
|
||||||
|
# sed -e 's/^/A /g' katg_mcsm_formatted_snps.csv > katg_mcsm_formatted_snps_chain.csv
|
||||||
|
#~/git/LSHTM_analysis/dynamut/split_csv_chain.sh katg_mcsm_formatted_snps_chain.csv snp_batches 50
|
||||||
|
|
||||||
|
# Date: 01/10/2021
|
||||||
|
# sed -e 's/^/A /g' rpob_mcsm_formatted_snps.csv > rpob_mcsm_formatted_snps_chain.csv
|
||||||
|
#~/git/LSHTM_analysis/dynamut/split_csv_chain.sh rpob_mcsm_formatted_snps_chain.csv snp_batches 50
|
||||||
|
|
||||||
|
# Date: 02/10/2021
|
||||||
|
# sed -e 's/^/A /g' alr_mcsm_formatted_snps.csv > alr_mcsm_formatted_snps_chain.csv
|
||||||
|
#~/git/LSHTM_analysis/dynamut/split_csv_chain.sh alr_mcsm_formatted_snps_chain.csv snp_batches 50
|
||||||
|
|
||||||
|
# Date: 05/10/2021
|
||||||
|
#~/git/LSHTM_analysis/dynamut/split_csv_chain.sh alr_mcsm_formatted_snps_chain.csv snp_batches 20
|
||||||
|
|
||||||
# add .txt to the files
|
# add .txt to the files
|
||||||
|
########################################################################
|
||||||
|
|
|
@ -81,9 +81,6 @@ indir = args.input_dir
|
||||||
outdir = args.output_dir
|
outdir = args.output_dir
|
||||||
make_dirs = args.make_dirs
|
make_dirs = args.make_dirs
|
||||||
|
|
||||||
#drug = 'streptomycin'
|
|
||||||
#gene = 'gid'
|
|
||||||
|
|
||||||
#%% input and output dirs and files
|
#%% input and output dirs and files
|
||||||
#=======
|
#=======
|
||||||
# dirs
|
# dirs
|
||||||
|
|
0
scripts/deepddg_format.py
Normal file → Executable file
0
scripts/deepddg_format.py
Normal file → Executable file
Loading…
Add table
Add a link
Reference in a new issue