Skip to content

Commit b9676e6

Browse files
committed
Merge remote-tracking branch 'refs/remotes/origin/drop_drugs' into drop_drugs
2 parents 56b8ea8 + 65c2570 commit b9676e6

2 files changed

Lines changed: 9 additions & 4 deletions

File tree

build/beatAML/GetBeatAML.py

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -473,6 +473,7 @@ def map_and_combine(df, data_type, entrez_map_file, improve_map_file, map_file=N
473473
mapped_df['entrez_id'] = mapped_df['entrez_id'].astype(int)
474474
mapped_df['source'] = 'synapse'
475475
mapped_df['study'] = 'BeatAML'
476+
mapped_df =mapped_df.drop_duplicates()
476477

477478
final_dataframe = mapped_df.dropna()
478479
return final_dataframe

build/mpnst/01_mpnst_get_omics.R

Lines changed: 8 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -46,21 +46,25 @@ manifest<-synapser::synTableQuery("select * from syn53503360")$asDataFrame()|>
4646
##they each get their own sample identifier
4747
pdx_data<-manifest|>dplyr::select(common_name,starts_with("PDX"))|>
4848
left_join(pdx_samps)|>
49-
dplyr::select(improve_sample_id,common_name,model_type,RNASeq='PDX_RNASeq',Mutations='PDX_Somatic_Mutations',CopyNumber='PDX_CNV',Proteomics='PDX_Proteomics')
49+
dplyr::select(improve_sample_id,common_name,model_type,RNASeq='PDX_RNASeq',Mutations='PDX_Somatic_Mutations',CopyNumber='PDX_CNV',Proteomics='PDX_Proteomics')|>
50+
subset(!is.na(improve_sample_id)
5051

5152
tumor_data<- manifest|>dplyr::select(common_name,starts_with("Tumor"))|>
5253
left_join(tumor_samps)|>
5354
dplyr::select(improve_sample_id,common_name,model_type,RNASeq='Tumor_RNASeq',Mutations='Tumor_Somatic_Mutations',CopyNumber='Tumor_CNV')|>
54-
mutate(Proteomics='') ##we dont have tumor proteomics from these samples
55+
mutate(Proteomics='')|>
56+
subset(!is.na(improve_sample_id)
57+
##we dont have tumor proteomics from these samples
5558
#print(tumor_data)
5659

5760
mt_data<- manifest|>dplyr::select(common_name,starts_with("PDX"))|>
5861
left_join(mt_samps)|>
59-
dplyr::select(improve_sample_id,common_name,model_type, RNASeq='PDX_RNASeq',Mutations='PDX_Somatic_Mutations',CopyNumber='PDX_CNV',Proteomics='PDX_Proteomics')##we dont have mt data yet, so collecting PDX instead
62+
dplyr::select(improve_sample_id,common_name,model_type, RNASeq='PDX_RNASeq',Mutations='PDX_Somatic_Mutations',CopyNumber='PDX_CNV',Proteomics='PDX_Proteomics')|>##we dont have mt data yet, so collecting PDX instead
63+
subset(!is.na(improve_sample_id)
6064
#print(tumor_data)
6165

6266

63-
combined<-rbind(pdx_data,tumor_data)|>distinct()
67+
combined<-rbind(pdx_data,tumor_data,mt_data)|>distinct()
6468

6569
# gene mapping table
6670
genes_df <- fread(genefile)

0 commit comments

Comments
 (0)