Skip to content

Commit b7dcd6b

Browse files
changes to build liverpdo dataset
1 parent f2f6e52 commit b7dcd6b

4 files changed

Lines changed: 94 additions & 3 deletions

File tree

build/build_dataset.py

Lines changed: 4 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -48,7 +48,8 @@ def process_docker(dataset,validate):
4848
'genes': ['genes'],
4949
'upload': ['upload'],
5050
'crcpdo': ['crcpdo'],
51-
'bladderpdo': ['bladderpdo']
51+
'bladderpdo': ['bladderpdo'],
52+
'liverpdo': ['liverpdo']
5253
}
5354

5455
# Collect container names to build based on the dataset provided. Always build 'genes'.
@@ -131,7 +132,8 @@ def process_omics(executor, dataset, should_continue):
131132
'sarcpdo': ['mutations', 'transcriptomics'],
132133
'pancpdo': ['transcriptomics'],
133134
'bladderpdo': ['copy_number', 'mutations', 'transcriptomics'],
134-
'crcpdo':['copy_number', 'mutations', 'transcriptomics']
135+
'crcpdo':['copy_number', 'mutations', 'transcriptomics'],
136+
'liverpdo':['copy_number', 'mutations', 'transcriptomics']
135137
}
136138

137139
expected_omics = dataset_omics_files.get(dataset, [])

build/docker/Dockerfile.liverpdo

Lines changed: 61 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,61 @@
1+
FROM r-base:4.4.1
2+
3+
# Build-time only: keeps apt/debconf from prompting during the RUN steps below
# without leaving DEBIAN_FRONTEND set in the environment of running containers.
ARG DEBIAN_FRONTEND=noninteractive
4+
5+
# Refresh the package index and install the compiler toolchain, download tools
# and development headers. The apt lists are removed in the same layer so they
# do not persist in the image.
6+
RUN apt-get update && \
7+
apt-get install -y build-essential wget curl libcurl4-openssl-dev libxml2-dev \
8+
zlib1g-dev libssl-dev libbz2-dev libreadline-dev libsqlite3-dev libffi-dev && \
rm -rf /var/lib/apt/lists/*
9+
10+
# Download the CPython 3.10.12 source tarball from python.org, configure it with
# --enable-optimizations and --enable-shared (shared library build), compile on
# all available cores, and install with `make altinstall`.
# The tarball and the extracted source tree are deleted in this same RUN so they
# do not remain in the layer.
# NOTE(review): the shared library is presumably needed for R's reticulate
# (see the commented-out RETICULATE_PYTHON setting further down) - confirm.
11+
RUN wget https://www.python.org/ftp/python/3.10.12/Python-3.10.12.tgz && \
12+
tar -xf Python-3.10.12.tgz && \
13+
cd Python-3.10.12 && \
14+
./configure --enable-optimizations --enable-shared && \
15+
make -j$(nproc) && \
16+
make altinstall && \
17+
cd .. && \
18+
rm -rf Python-3.10.12.tgz Python-3.10.12
19+
20+
# Make the freshly built interpreter and its pip the default `python3` / `pip3`.
# -f replaces an existing link or file, so the build does not abort with
# "File exists" if the base image already provides /usr/bin/python3 or pip3.
21+
RUN ln -sf /usr/local/bin/python3.10 /usr/bin/python3 && \
22+
ln -sf /usr/local/bin/pip3.10 /usr/bin/pip3
23+
24+
# Register /usr/local/lib with the dynamic linker and rebuild its cache so the
# shared libpython installed there can be resolved at run time.
25+
RUN printf '%s\n' "/usr/local/lib" >> /etc/ld.so.conf.d/python3.10.conf && ldconfig
26+
27+
# Create a Python virtual environment
28+
#RUN python3 -m venv /opt/venv
29+
#RUN /opt/venv/bin/pip install --upgrade pip
30+
31+
# Set environment variables for reticulate
32+
#ENV RETICULATE_PYTHON="/opt/venv/bin/python3"
33+
# Put /app (the working directory the scripts are copied into) on Python's
# module search path. A '#' in the middle of an ENV line is not a comment, so
# the previous value expanded to "/app#:/app" and carried a bogus "/app#" entry.
ENV PYTHONPATH=/app
34+
WORKDIR /app
35+
36+
# Point MPLCONFIGDIR at a directory under /app and create that directory at
# build time so it exists and is writable.
37+
ENV MPLCONFIGDIR=/app/tmp/matplotlib
38+
RUN mkdir -p "${MPLCONFIGDIR}"
39+
40+
41+
# Copy only the R requirements script first so this layer stays cached until
# that script changes. COPY is used because this is a plain local file and
# none of ADD's extra behaviour (archive extraction, URL fetch) is wanted.
COPY build/liverpdo/requirements.R .
42+
# installing r libraries
43+
RUN Rscript requirements.R
44+
45+
46+
47+
# installing python libraries
# COPY (not ADD) for a plain local file; --no-cache-dir keeps pip's download
# cache out of the image layer.
48+
COPY build/liverpdo/requirements.txt .
49+
#RUN /opt/venv/bin/pip3 install -r requirements.txt
50+
RUN pip3 install --no-cache-dir -r requirements.txt
51+
52+
# Build-time sanity checks: print the version of the default python3 and the
# location of Rscript; either command failing stops the build here.
RUN python3 --version
53+
RUN which Rscript
54+
55+
#ENV PATH="/opt/venv/bin:$PATH"
56+
57+
# Copy the liverpdo build scripts and the shared build utilities into the
# working directory. COPY is used instead of ADD because these are plain local
# files; the glob patterns are kept exactly as they were.
COPY build/liverpdo/CNV-segfile-annotation.R ./
58+
COPY build/liverpdo/*py ./
59+
COPY build/liverpdo/*sh ./
60+
61+
COPY build/utils/* ./

build/docker/docker-compose.yml

Lines changed: 10 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -112,4 +112,13 @@ services:
112112
args:
113113
HTTPS_PROXY: ${HTTPS_PROXY}
114114
platform: linux/amd64
115-
image: crcpdo:latest
115+
image: crcpdo:latest
116+
117+
# liverpdo service: builds image liverpdo:latest for linux/amd64 from
# build/docker/Dockerfile.liverpdo, using ../../ (relative to this compose
# file) as the build context and passing HTTPS_PROXY through as a build arg.
liverpdo:
118+
build:
119+
context: ../../
120+
dockerfile: build/docker/Dockerfile.liverpdo
121+
args:
122+
HTTPS_PROXY: ${HTTPS_PROXY}
123+
platform: linux/amd64
124+
image: liverpdo:latest

build/liverpdo/requirements.txt

Lines changed: 19 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,19 @@
1+
pandas
2+
numpy==1.23
3+
#os
4+
#gzip
5+
requests
6+
#argparse
7+
synapseclient
8+
matplotlib
9+
#math
10+
#time
11+
#threading
12+
#signal
13+
rdkit
14+
mordred
15+
#multiprocessing
16+
tqdm
17+
#itertools
18+
scikit-learn
19+
openpyxl

0 commit comments

Comments
 (0)