Added the commonly used mutation format for missense mutations to the gene_specific nssnp_info file

This commit is contained in:
Tanushree Tunstall 2020-06-24 13:34:35 +01:00
parent a9498f8e08
commit 27a656dba1
4 changed files with 194 additions and 568 deletions

View file

@ -221,9 +221,9 @@ else:
print('FAIL: Second cross check unsuccessfull. Debug please!')
sys.exit()
#%% extract mut info into three cols
# Column count before the three columns below are added. orig_len is not used
# within this excerpt -- presumably a later sanity check compares against it
# (TODO confirm against the rest of the script).
orig_len = len(dfm2_mis.columns)

# The patterns are raw strings: '\w' and '\d' are invalid escape sequences in
# ordinary string literals and trigger a warning on recent Python versions.
# The regex text handed to pandas is unchanged. Rows whose 'mut_info' does not
# match a pattern get NaN in the corresponding new column.

# Single word character immediately before the first matching '>'.
dfm2_mis['wild_type'] = dfm2_mis['mut_info'].str.extract(r'(\w{1})>')
# First run of digits found in 'mut_info'; the value is kept as text, it is
# not converted to an integer here.
dfm2_mis['position'] = dfm2_mis['mut_info'].str.extract(r'(\d+)')
# Single word character that follows '>' and a run of digits.
dfm2_mis['mutant_type'] = dfm2_mis['mut_info'].str.extract(r'>\d+(\w{1})')