@@ -103,10 +103,10 @@ def map_transcriptomics(transciptomics_data, improve_id_data, entrez_data):
103103 # move row names to a column called "stable_id" and format gene names to remove the chromosome num
104104 transciptomics_data ['stable_id' ] = transciptomics_data .index
105105 transciptomics_data ['stable_id' ] = transciptomics_data ['stable_id' ].str .split ('__' ,n = 1 ,expand = True ).iloc [:,0 ]
106- transciptomics_data .to_csv ("/tmp/counts_for_tpm_conversion.csv" )
106+ transciptomics_data .to_csv ("/tmp/counts_for_tpm_conversion.tsv" , sep = ' \t ' )
107107
108108 # run tpmFromCounts.py to convert counts to tpm
109- os .system ("python3 tpmFromCounts.py --counts /tmp/counts_for_tpm_conversion.csv --genome_build https://ftp.ncbi.nlm.nih.gov/genomes/all/GCF/000/001/405/GCF_000001405.13_GRCh37/GCF_000001405.13_GRCh37_genomic.gtf.gz --gene_col stable_id --exclude_col stable_id --out_file /tmp/transcriptomics_tpm.tsv" )
109+ os .system ("python3 tpmFromCounts.py --counts /tmp/counts_for_tpm_conversion.tsv --genome_build https://ftp.ncbi.nlm.nih.gov/genomes/all/GCF/000/001/405/GCF_000001405.13_GRCh37/GCF_000001405.13_GRCh37_genomic.gtf.gz --gene_col stable_id --exclude_col stable_id --out_file /tmp/transcriptomics_tpm.tsv" )
110110
111111 # get output from script (in tsv format) and average across organoids from each patient ]
112112 tpm_transciptomics_data = pd .read_csv ("/tmp/transcriptomics_tpm.tsv" , sep = "\t " )
@@ -266,5 +266,5 @@ def map_copy_number(copy_number_data, improve_id_data, entrez_data):
266266 else :
267267 print ("Starting copy number data." )
268268 mutation_df = map_copy_number (copy_number_data = "/tmp/copy_num_data.csv" , improve_id_data = "/tmp/crc_organoids_samples.csv" , entrez_data = "/tmp/genes.csv" )
269- mutation_df .to_csv ("/tmp/crc_organoids_copynumber .csv" , index = False )
269+ mutation_df .to_csv ("/tmp/crc_organoids_copy_number .csv" , index = False )
270270
0 commit comments