@@ -82,7 +82,7 @@ def map_mutations(mutation_data, improve_id_data, entrez_data):
8282 mapped_mutation_data = mapped_mutation_data .rename (columns = {'Entrez_Gene_Id' :'entrez_id' ,'Genome_Change' :'mutation' ,'Variant_Classification' :'variant_classification' })
8383 mapped_mutation_data = mapped_mutation_data .drop (columns = ['Hugo_Symbol' ,'Tumor_Sample_Barcode' ,'other_id' ])
8484 mapped_mutation_data ['source' ] = "vandeWetering_2015"
85- mapped_mutation_data ['study' ] = "crcPDO "
85+ mapped_mutation_data ['study' ] = "crcpdo "
8686 mapped_mutation_data = mapped_mutation_data .astype ({'entrez_id' :'int' })
8787
8888 return (mapped_mutation_data )
@@ -136,7 +136,7 @@ def map_transcriptomics(transciptomics_data, improve_id_data, entrez_data):
136136 # clean up column names and data types
137137 mapped_transcriptomics_df = mapped_transcriptomics_df .drop (columns = ['stable_id' ,'patient' ,'other_id' ])
138138 mapped_transcriptomics_df ['source' ] = "vandeWetering_2015"
139- mapped_transcriptomics_df ['study' ] = "crcPDO "
139+ mapped_transcriptomics_df ['study' ] = "crcpdo "
140140 mapped_transcriptomics_df = mapped_transcriptomics_df .astype ({'entrez_id' :'int' ,'improve_sample_id' :'int' })
141141 mapped_transcriptomics_df = mapped_transcriptomics_df [['entrez_id' ,'transcriptomics' ,'improve_sample_id' ,'source' ,'study' ]]
142142
@@ -198,7 +198,7 @@ def map_copy_number(copy_number_data, improve_id_data, entrez_data):
198198 # clean up columns and data types
199199 improve_mapped_cn_df = improve_mapped_cn_df .drop (columns = ['ID' ,'score' ,'other_id' ])
200200 improve_mapped_cn_df ['source' ] = "vandeWetering_2015"
201- improve_mapped_cn_df ['study' ] = "crcPDO "
201+ improve_mapped_cn_df ['study' ] = "crcpdo "
202202 improve_mapped_cn_df = improve_mapped_cn_df .rename (columns = {'ENTREZID' :'entrez_id' })
203203 improve_mapped_cn_df = improve_mapped_cn_df .astype ({'entrez_id' :'int' ,'improve_sample_id' :'int' })
204204 improve_mapped_cn_df = improve_mapped_cn_df [['entrez_id' ,'copy_number' ,'copy_call' ,'study' ,'source' ,'improve_sample_id' ]]
@@ -241,8 +241,8 @@ def map_copy_number(copy_number_data, improve_id_data, entrez_data):
241241 exit ()
242242 else :
243243 print ("Starting transcriptomics data." )
244- transcriptomics_df = map_transcriptomics (transciptomics_data = "/tmp/GSE65253_col_tum_org_merge.csv.gz" , improve_id_data = "/tmp/crcPDO_samples .csv" , entrez_data = "/tmp/genes.csv" )
245- transcriptomics_df .to_csv ("/tmp/crcPDO_transcriptomics .csv" , index = False )
244+ transcriptomics_df = map_transcriptomics (transciptomics_data = "/tmp/GSE65253_col_tum_org_merge.csv.gz" , improve_id_data = "/tmp/crcpdo_samples .csv" , entrez_data = "/tmp/genes.csv" )
245+ transcriptomics_df .to_csv ("/tmp/crcpdo_transcriptomics .csv" , index = False )
246246
247247 if args .mutations :
248248 if args .genes is None or args .genes == '' :
@@ -253,8 +253,8 @@ def map_copy_number(copy_number_data, improve_id_data, entrez_data):
253253 exit ()
254254 else :
255255 print ("Starting mutations data." )
256- mutation_df = map_mutations (mutation_data = "/tmp/mutation_data.csv" , improve_id_data = "/tmp/crcPDO_samples .csv" , entrez_data = "/tmp/genes.csv" )
257- mutation_df .to_csv ("/tmp/crcPDO_mutations .csv" , index = False )
256+ mutation_df = map_mutations (mutation_data = "/tmp/mutation_data.csv" , improve_id_data = "/tmp/crcpdo_samples .csv" , entrez_data = "/tmp/genes.csv" )
257+ mutation_df .to_csv ("/tmp/crcpdo_mutations .csv" , index = False )
258258
259259 if args .copy_number :
260260 if args .genes is None or args .genes == '' :
@@ -265,6 +265,6 @@ def map_copy_number(copy_number_data, improve_id_data, entrez_data):
265265 exit ()
266266 else :
267267 print ("Starting copy number data." )
268- mutation_df = map_copy_number (copy_number_data = "/tmp/copy_num_data.csv" , improve_id_data = "/tmp/crcPDO_samples .csv" , entrez_data = "/tmp/genes.csv" )
269- mutation_df .to_csv ("/tmp/crcPDO_copy_number .csv" , index = False )
268+ mutation_df = map_copy_number (copy_number_data = "/tmp/copy_num_data.csv" , improve_id_data = "/tmp/crcpdo_samples .csv" , entrez_data = "/tmp/genes.csv" )
269+ mutation_df .to_csv ("/tmp/crcpdo_copy_number .csv" , index = False )
270270
0 commit comments