@@ -14,14 +14,16 @@ First we get the packages loaded and logged into synapse.
1414knitr::opts_chunk$set(echo = TRUE)
1515library(tidyverse)
1616library(ggplot2)
17- source('coderdataResultsFunctions.R')
17+ library(arrow)
18+ library(dplyr)
1819
20+ source('coderdataResultsFunctions.R')
1921```
2022
2123
2224The data has been uploaded by natasha and can be downloaded as follows.
2325
24- ``` {r download data}
26+ ``` {r download data, eval }
2527
2628 cdres <- getModelPerformanceData()
2729
@@ -33,7 +35,7 @@ The data has been uploaded by natasha and can be downloaded as follows.
3335## Figure 4A
3436
3537
36- ``` {r}
38+ ``` {r, eval=FALSE }
3739metrics <- c('scc','pcc')
3840exres = lapply(metrics,function(x) {
3941 res<-ridgelineMetricPlots(x, ecdres,'cellline')
@@ -47,7 +49,7 @@ print(exres)
4749
4850Now we can confirm that the datasets follow the same pattern.
4951
50- ``` {r dataset samples}
52+ ``` {r dataset samples, eval=FALSE }
5153
5254
5355plot<-calcSourceStatistics('scc',ecdres)
@@ -61,7 +63,25 @@ print(plot)
6163## Create funtion to dive in
6264
6365
66+ Full model predictions are stored on synapse as parquet files. Individual
67+ datasets can be downloaded via ` getModelPredictionData ` in
68+ ` coderdataResultsFunctions.R ` (sources during the setup process).
69+ ``` {r lgbm data import}
6470
65- ``` {r}
71+ lgbm_all_preds <- getModelPredictionData(dset = "lgbm")
6672
6773```
74+
75+ ``` {r subsetting data}
76+ query <- lgbm_all_preds |>
77+ dplyr::filter(target == 'mpnst')
78+
79+ mpnst_response_data <- query |> collect()
80+ ```
81+
82+ ``` {r}
83+ options(repr.plot.width = 5, repr.plot.height = 15)
84+ plot <- ggplot(mpnst_response_data, aes(x=auc_true, y=auc_pred)) + geom_point() + geom_smooth(method=lm) + facet_grid(source ~ .)
85+ ggsave('mpnst_auc_plot.pdf', plot, dpi=300, width=5, height=20)
86+ ```
87+
0 commit comments