From c441cecdb9b1b17a2782b4b2dd4c61656e471e29 Mon Sep 17 00:00:00 2001
From: Laurent Modolo <laurent.modolo@ens-lyon.fr>
Date: Thu, 12 Oct 2023 16:01:49 +0200
Subject: [PATCH] run.sh: add resume tag

---
 run.sh | 33 +++++++++++++++++++++++++++++++++
 1 file changed, 33 insertions(+)
 create mode 100644 run.sh

diff --git a/run.sh b/run.sh
new file mode 100644
index 0000000..a6ff9bd
--- /dev/null
+++ b/run.sh
@@ -0,0 +1,33 @@
+cd data/
+# Download the fastq
+awk '{system("fasterq-dump "$0)}' SRR_Acc_List.txt
+ls -l *.fastq \
+    | awk '{system("gzip "$9)}'
+
+# Download the fasta
+aws s3 --no-sign-request --region eu-west-1 sync s3://ngi-igenomes/igenomes/Homo_sapiens/Ensembl/GRCh37/Sequence/WholeGenomeFasta/ ./GRCh37/
+aws s3 --no-sign-request --region eu-west-1 sync s3://ngi-igenomes/igenomes/Mus_musculus/Ensembl/GRCm38/Sequence/WholeGenomeFasta/ ./GRCm38/
+
+# Concatenate the fasta
+
+cat GRCh37/genome.fa \
+    | sed -E 's/(>.*)/\1_GRCh37/g' \
+    > GRCh37_GRCm38_mix.fa
+cat GRCm38/genome.fa \
+    | sed -E 's/(>.*)/\1_GRCm38/g' \
+    >> GRCh37_GRCm38_mix.fa
+
+cd ../
+
+nextflow run main.nf \
+   -profile psmn \
+   --workflow hicpro \
+   --input data/sample.csv \
+   --fasta data/GRCh37_GRCm38_mix.fa \
+   --outdir results/ \
+   --digestion hindiii \
+   --keep_dups \
+   --filter_pcr_picard \
+   -resume
+
+
-- 
GitLab