From 0c1bbd59bbd87b6e99b36d4b17b91f841a162406 Mon Sep 17 00:00:00 2001 From: Laurent Modolo <laurent.modolo@ens-lyon.fr> Date: Wed, 22 Aug 2018 15:37:08 +0200 Subject: [PATCH] Kallisto: update nf structure --- src/nf_modules/Kallisto/indexing.config | 26 ++++ .../Kallisto/{tests/index.nf => indexing.nf} | 3 +- src/nf_modules/Kallisto/kallisto.nf | 123 ------------------ ...{kallisto.config => mapping_paired.config} | 14 -- .../Kallisto/{tests => }/mapping_paired.nf | 0 src/nf_modules/Kallisto/mapping_single.config | 26 ++++ .../Kallisto/{tests => }/mapping_single.nf | 0 src/nf_modules/Kallisto/{tests => }/tests.sh | 12 +- 8 files changed, 60 insertions(+), 144 deletions(-) create mode 100644 src/nf_modules/Kallisto/indexing.config rename src/nf_modules/Kallisto/{tests/index.nf => indexing.nf} (83%) delete mode 100644 src/nf_modules/Kallisto/kallisto.nf rename src/nf_modules/Kallisto/{kallisto.config => mapping_paired.config} (57%) rename src/nf_modules/Kallisto/{tests => }/mapping_paired.nf (100%) create mode 100644 src/nf_modules/Kallisto/mapping_single.config rename src/nf_modules/Kallisto/{tests => }/mapping_single.nf (100%) rename src/nf_modules/Kallisto/{tests => }/tests.sh (50%) diff --git a/src/nf_modules/Kallisto/indexing.config b/src/nf_modules/Kallisto/indexing.config new file mode 100644 index 00000000..94c14cd2 --- /dev/null +++ b/src/nf_modules/Kallisto/indexing.config @@ -0,0 +1,26 @@ +profiles { + docker { + docker.temp = 'auto' + docker.enabled = true + process { + $index_fasta { + container = "kallisto:0.44.0" + } + } + } + sge { + process{ + $index_fasta { + beforeScript = "module purge; module load Kallisto/0.44.0" + executor = "sge" + cpus = 1 + memory = "5GB" + time = "6h" + queueSize = 1000 + pollInterval = '60sec' + queue = 'h6-E5-2667v4deb128' + penv = 'openmp8' + } + } + } +} diff --git a/src/nf_modules/Kallisto/tests/index.nf b/src/nf_modules/Kallisto/indexing.nf similarity index 83% rename from src/nf_modules/Kallisto/tests/index.nf rename to src/nf_modules/Kallisto/indexing.nf index cae4bb03..9e38260f 100644 --- a/src/nf_modules/Kallisto/tests/index.nf +++ b/src/nf_modules/Kallisto/indexing.nf @@ -17,11 +17,12 @@ process index_fasta { output: file "*.index*" into index_files + file "*_kallisto_report.txt" into index_files_report script: """ kallisto index -k 31 --make-unique -i ${fasta.baseName}.index ${fasta} \ -> ${fasta.baseName}_kallisto_report.txt +2> ${fasta.baseName}_kallisto_report.txt """ } diff --git a/src/nf_modules/Kallisto/kallisto.nf b/src/nf_modules/Kallisto/kallisto.nf deleted file mode 100644 index ae6b6b71..00000000 --- a/src/nf_modules/Kallisto/kallisto.nf +++ /dev/null @@ -1,123 +0,0 @@ -/* -* Kallisto : -* Imputs : fastq files -* Imputs : fasta files -* Output : bam files -*/ - -/* fasta indexing */ -params.fasta = "$baseDir/data/bam/*.fasta" - -log.info "fasta files : ${params.fasta}" - -Channel - .fromPath( params.fasta ) - .ifEmpty { error "Cannot find any fasta files matching: ${params.fasta}" } - .set { fasta_file } - -process index_fasta { - tag "$fasta.baseName" - publishDir "results/mapping/index/", mode: 'copy' - - input: - file fasta from fasta_file - - output: - file "*.index*" into index_files - - script: -""" -kallisto index -k 31 --make-unique -i ${fasta.baseName}.index ${fasta} \ -> ${fasta.baseName}_kallisto_report.txt -""" -} - - -/* -* for paired-end data -*/ - -params.fastq = "$baseDir/data/fastq/*_{1,2}.fastq" -params.index = "$baseDir/data/index/*.index.*" - -log.info "fastq files : ${params.fastq}" -log.info "index files : ${params.index}" - -Channel - .fromFilePairs( params.fastq ) - .ifEmpty { error "Cannot find any fastq files matching: ${params.fastq}" } - .set { fastq_files } -Channel - .fromPath( params.index ) - .ifEmpty { error "Cannot find any index files matching: ${params.index}" } - .set { index_files } - -process mapping_fastq { - tag "$reads" - cpus 4 - publishDir "results/mapping/quantification/", mode: 'copy' - - input: - set pair_id, file(reads) from fastq_files - file index from index_files.collect() - - output: - file "*" into counts_files - - script: -""" -mkdir ${reads[0].baseName} -kallisto quant -i ${index} -t ${task.cpus} \ ---bias --bootstrap-samples 100 -o ${pair_id} \ -${reads[0]} ${reads[1]} &> ${pair_id}_kallisto_report.txt -""" -} - - -/* -* for single-end data -*/ - -params.fastq = "$baseDir/data/fastq/*.fastq" -params.index = "$baseDir/data/index/*.index*" -params.mean = 200 -params.sd = 100 - -log.info "fastq files : ${params.fastq}" -log.info "index files : ${params.index}" -log.info "mean read size: ${params.mean}" -log.info "sd read size: ${params.sd}" - -Channel - .fromPath( params.fastq ) - .ifEmpty { error "Cannot find any fastq files matching: ${params.fastq}" } - .map { it -> [(it.baseName =~ /([^\.]*)/)[0][1], it]} - .set { fastq_files } -Channel - .fromPath( params.index ) - .ifEmpty { error "Cannot find any index files matching: ${params.index}" } - .set { index_files } - -process mapping_fastq { - tag "$file_id" - cpus 4 - publishDir "results/mapping/quantification/", mode: 'copy' - - input: - set file_id, file(reads) from fastq_files - file index from index_files.collect() - - output: - file "*" into count_files - - script: -""" -mkdir ${file_id} -kallisto quant -i ${index} -t ${task.cpus} --single \ ---bias --bootstrap-samples 100 -o ${file_id} \ --l ${params.mean} -s ${params.sd} \ -${reads} > ${file_id}_kallisto_report.txt -""" -} - - diff --git a/src/nf_modules/Kallisto/kallisto.config b/src/nf_modules/Kallisto/mapping_paired.config similarity index 57% rename from src/nf_modules/Kallisto/kallisto.config rename to src/nf_modules/Kallisto/mapping_paired.config index da7f54e0..de674527 100644 --- a/src/nf_modules/Kallisto/kallisto.config +++ b/src/nf_modules/Kallisto/mapping_paired.config @@ -3,9 +3,6 @@ profiles { docker.temp = 'auto' docker.enabled = true process { - $index_fasta { - container = "kallisto:0.44.0" - } $mapping_fastq { container = "kallisto:0.44.0" } @@ -13,17 +10,6 @@ profiles { } sge { process{ - $index_fasta { - beforeScript = "module purge; module load Kallisto/0.44.0" - executor = "sge" - cpus = 1 - memory = "5GB" - time = "6h" - queueSize = 1000 - pollInterval = '60sec' - queue = 'h6-E5-2667v4deb128' - penv = 'openmp8' - } $mapping_fastq { beforeScript = "module purge; module load Kallisto/0.44.0" executor = "sge" diff --git a/src/nf_modules/Kallisto/tests/mapping_paired.nf b/src/nf_modules/Kallisto/mapping_paired.nf similarity index 100% rename from src/nf_modules/Kallisto/tests/mapping_paired.nf rename to src/nf_modules/Kallisto/mapping_paired.nf diff --git a/src/nf_modules/Kallisto/mapping_single.config b/src/nf_modules/Kallisto/mapping_single.config new file mode 100644 index 00000000..de674527 --- /dev/null +++ b/src/nf_modules/Kallisto/mapping_single.config @@ -0,0 +1,26 @@ +profiles { + docker { + docker.temp = 'auto' + docker.enabled = true + process { + $mapping_fastq { + container = "kallisto:0.44.0" + } + } + } + sge { + process{ + $mapping_fastq { + beforeScript = "module purge; module load Kallisto/0.44.0" + executor = "sge" + cpus = 4 + memory = "5GB" + time = "6h" + queueSize = 1000 + pollInterval = '60sec' + queue = 'h6-E5-2667v4deb128' + penv = 'openmp8' + } + } + } +} diff --git a/src/nf_modules/Kallisto/tests/mapping_single.nf b/src/nf_modules/Kallisto/mapping_single.nf similarity index 100% rename from src/nf_modules/Kallisto/tests/mapping_single.nf rename to src/nf_modules/Kallisto/mapping_single.nf diff --git a/src/nf_modules/Kallisto/tests/tests.sh b/src/nf_modules/Kallisto/tests.sh similarity index 50% rename from src/nf_modules/Kallisto/tests/tests.sh rename to src/nf_modules/Kallisto/tests.sh index f83a4cac..ec20292e 100755 --- a/src/nf_modules/Kallisto/tests/tests.sh +++ b/src/nf_modules/Kallisto/tests.sh @@ -1,16 +1,16 @@ -nextflow src/nf_modules/Kallisto/tests/index.nf \ - -c src/nf_modules/Kallisto/kallisto.config \ +nextflow src/nf_modules/Kallisto/indexing.nf \ + -c src/nf_modules/Kallisto/indexing.config \ -profile docker \ --fasta "data/tiny_dataset/fasta/tiny_v2.fasta" -nextflow src/nf_modules/Kallisto/tests/mapping_single.nf \ - -c src/nf_modules/Kallisto/kallisto.config \ +nextflow src/nf_modules/Kallisto/mapping_single.nf \ + -c src/nf_modules/Kallisto/mapping_single.config \ -profile docker \ --index "results/mapping/index/tiny_v2.index" \ --fastq "data/tiny_dataset/fastq/tiny*_S.fastq" -nextflow src/nf_modules/Kallisto/tests/mapping_paired.nf \ - -c src/nf_modules/Kallisto/kallisto.config \ +nextflow src/nf_modules/Kallisto/mapping_paired.nf \ + -c src/nf_modules/Kallisto/mapping_paired.config \ -profile docker \ --index "results/mapping/index/tiny_v2.index" \ --fastq "data/tiny_dataset/fastq/tiny*_R{1,2}.fastq" -- GitLab