-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathmain.sh
48 lines (41 loc) · 1.57 KB
/
main.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
#!/bin/bash
#change to home directory
cd SageMaker
#create necessary folders
mkdir metadata
mkdir metadata/methylation_data #no cloud link for this
mkdir data/encode_data/bigWigs -p
mkdir results
mkdir results/adata_dependencies
mkdir results/models
mkdir results/enrichment
mkdir figures
#download Ensembl 105 from an R script
source activate R
Rscript scripts/Ensembl-105-EnsDb-for-Homo-sapiens.r
conda deactivate
#download metadata for the 27k and 450k Illumina DNA methylation arrays
wget https://zhouserver.research.chop.edu/InfiniumAnnotation/20180909/HM27/HM27.hg38.manifest.tsv.gz -P metadata
wget https://zhouserver.research.chop.edu/InfiniumAnnotation/20180909/HM450/HM450.hg38.manifest.tsv.gz -P metadata
#install required python packages
source activate python3
mamba install -c conda-forge -c bioconda gseapy -y
mamba install -c bioconda pybigwig -y
mamba install -c conda-forge dynamo-release -y
pip install -r requirements.txt
#download data
python scripts/download_and_process_methylation.py
python scripts/download_and_process_encode.py
python scripts/download_and_process_encode_imputation.py
python scripts/download_and_process_encode_primary_cells_untreated.py
#run scripts
python scripts/nested_cv.py
python scripts/nested_cv_adult_only.py
python scripts/nested_cv_sim_methylation.py
python scripts/nested_cv_pan_histone.py
python scripts/nested_cv_noise.py
python scripts/nested_cv_across_histones.py
python scripts/nested_cv_across_histones_flipped.py
python scripts/nested_cv_across_histone_group.py
python scripts/train_histone_models.py
python scripts/train_pan_histone_model.py