Skip to content

Commit 2801077

Browse files
committed
adding print statements for debug on AWS
1 parent 2578dec commit 2801077

1 file changed

Lines changed: 10 additions & 1 deletion

File tree

build/broad_sanger/05b_separate_datasets.py

Lines changed: 10 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -5,6 +5,12 @@
55
import shutil
66

77
def main():
8+
9+
print("ls:\n")
10+
files = os.listdir(".")
11+
print(files)
12+
print("\n")
13+
814
datasets_to_process = ["CCLE", "CTRPv2", "PRISM", "GDSCv1", "GDSCv2", "FIMM", "gCSI", "NCI60"]
915
omics_datatypes = ["transcriptomics","proteomics", "copy_number","mutations"] # csv
1016
samples_datatypes = ["samples"] #csv
@@ -71,12 +77,15 @@ def main():
7177
#One by one, filter other Omics files, write to file, delete from mem.
7278
for omics in omics_datatypes:
7379
ds = dataset_sources[dataset][0]
74-
#print(ds)
80+
print(f"ds: {ds}")
7581
omics_filename_in = f"{ds}_{omics}.csv"
82+
print(f"omics_filename_in: {omics_filename_in}")
7683
if os.path.isfile(omics_filename_in + ".gz"):
7784
omics_filename_in += ".gz"
85+
print(f"omics_filename_in: {omics_filename_in}")
7886

7987
omics_filename_out = f"/tmp/{dataset}_{omics}.csv".lower()
88+
print(f"omics_filename_out: {omics_filename_out}")
8089
omics_df = pl.read_csv(omics_filename_in)
8190
omics_df = omics_df.filter(pl.col("improve_sample_id").is_in(exp_improve_sample_ids))
8291
# omics_df = omics_df.filter(pl.col("source").is_in(dataset_sources[dataset]))

0 commit comments

Comments
 (0)