pipeline_building_cec.md

// Enable the DSL2 syntax (required for include / workflow blocks).
nextflow.enable.dsl=2
// Import the fastp process from the local module file.
include { fastp } from "./nf_modules/fastp/main.nf"
// Build the fastq_files channel from the files matching the glob below.
// size: -1 lets each emitted group hold any number of files instead of
// exactly two, so single-end and paired-end data are both accepted.
channel
  .fromFilePairs( "data/tiny_dataset/fastq/*_R{1,2}.fastq", size: -1)
  .set { fastq_files }
// Entry workflow: run fastp on every item of fastq_files.
workflow {
  fastp(fastq_files)
}
// Default glob for the input reads; can be overridden on the command line
// with --fastq "<glob>".
params.fastq = "data/fastq/*_{1,2}.fastq"
// Same channel as before, but built from the params.fastq glob instead of a
// hard-coded path.
channel
  .fromFilePairs( params.fastq, size: -1)
  .set { fastq_files }
// Print the glob actually used at the start of the run.
log.info "fastq files: ${params.fastq}"
include { index_fasta; mapping_fastq } from './nf_modules/kallisto/main.nf'
// Print the value of params.fasta at the start of the run.
// (Nextflow/Groovy comments use `//`; a trailing `#` is a syntax error.)
log.info "fasta file : ${params.fasta}"  // to display the value of the variable

// Build the fasta_file channel: one [name, file] pair per file matching
// params.fasta, where name is the file's simpleName (file name without
// extension). The run is aborted with an explicit message when nothing matches.
channel
  .fromPath( params.fasta )
  .ifEmpty { error "Cannot find any fasta files matching: ${params.fasta}" }
  .map { it -> [it.simpleName, it]}
  .set { fasta_file }
// Entry workflow: run fastp on the reads and index_fasta on the fasta file.
// The two calls take different input channels and do not consume each
// other's output.
workflow {
  fastp(fastq_files)
  index_fasta(fasta_file)
}
// Entry workflow: run fastp on the reads, index the fasta file, then map the
// fastp output against the index.
workflow {
  fastp(fastq_files)
  index_fasta(fasta_file)
  mapping_fastq(index_fasta.out.index.collect(), fastp.out.fastq)  // .collect() so the same index is reused for each fastq file
}
include { index_fasta; mapping_fastq } from './nf_modules/kallisto/main.nf' addParams( mapping_fastq: " -l mean_frag_size -s sd_value ")
include { index_fasta; mapping_fastq } from './nf_modules/bowtie2/main.nf'
// Print the value of params.fasta at the start of the run.
// (Nextflow/Groovy comments use `//`; a trailing `#` is a syntax error.)
log.info "fasta file : ${params.fasta}"  // to display the value of the variable

// Build the fasta_file channel: one [name, file] pair per file matching
// params.fasta, where name is the file's simpleName (file name without
// extension). The run is aborted with an explicit message when nothing matches.
channel
  .fromPath( params.fasta )
  .ifEmpty { error "Cannot find any fasta files matching: ${params.fasta}" }
  .map { it -> [it.simpleName, it]}
  .set { fasta_file }
// Entry workflow: run fastp on the reads and index_fasta on the fasta file.
// The two calls take different input channels and do not consume each
// other's output.
workflow {
  fastp(fastq_files)
  index_fasta(fasta_file)
}
// Entry workflow: run fastp on the reads, index the fasta file, then map the
// fastp output against the index.
workflow {
  fastp(fastq_files)
  index_fasta(fasta_file)
  // .collect() so the same index is reused for each fastq file
  mapping_fastq(index_fasta.out.index.collect(), fastp.out.fastq)
}
params.<process_name>_out = "path"
include { fastp } from './nf_modules/fastp/main.nf' addParams(fastp_out: "fastQC/")
include { index_fasta; mapping_fastq } from './nf_modules/kallisto/main.nf' addParams(mapping_fastq: " -l mean_frag_size -s sd_value ", mapping_fastq_out: "quantification/")
// or, for bowtie2:
include { index_fasta; mapping_fastq } from './nf_modules/bowtie2/main.nf' addParams(mapping_fastq_out: "alignment")
  log.info "fasta file : ${params.cds_fasta}"  // for kallisto, which uses c_elegans.PRJNA13758.WS278.all_transcripts.fa
  log.info "fasta file : ${params.genomic_fasta}"  // for bowtie2, which uses c_elegans.PRJNA13758.WS278.genomic.fa
// Channel of [name, file] pairs for the files matching params.cds_fasta
// (name = simpleName of the file). Stops the run with an explicit message
// when no file matches.
channel
  .fromPath( params.cds_fasta )
  .ifEmpty { error "Cannot find any fasta files matching: ${params.cds_fasta}" }
  .map { it -> [it.simpleName, it]}
  .set { cds_fasta_file }

// Same construction for the files matching params.genomic_fasta.
channel
  .fromPath( params.genomic_fasta )
  .ifEmpty { error "Cannot find any fasta files matching: ${params.genomic_fasta}" }
  .map { it -> [it.simpleName, it]}
  .set { genomic_fasta_file }
include {
  index_fasta as kallisto_index_fasta;
  mapping_fastq as kallisto_mapping_fastq
 } from './nf_modules/kallisto/main.nf' addParams( mapping_fastq_out: "quantif/", mapping_fastq: " -l 459.8 -s 198.5 ")

include {
  index_fasta as bowtie_index_fasta;
  mapping_fastq as bowtie_mapping_fastq
} from './nf_modules/bowtie2/main.nf' addParams(mapping_fastq_out: "align/")
// Entry workflow: run fastp once, then feed its output to two independent
// branches: kallisto (indexed on cds_fasta_file) and bowtie (indexed on
// genomic_fasta_file).
workflow {
  fastp(fastq_files)
  kallisto_index_fasta(cds_fasta_file)
  kallisto_mapping_fastq(kallisto_index_fasta.out.index.collect(), fastp.out.fastq)  // .collect() to reuse the index for each fastq file
  bowtie_index_fasta(genomic_fasta_file)
  bowtie_mapping_fastq(bowtie_index_fasta.out.index.collect(), fastp.out.fastq)
          }
login@allo-psmn
login@cl6242comp2
# Create a personal working directory and move into it
# (replace <login> with your own login).
mkdir -p /scratch/Bio/<login>
cd /scratch/Bio/<login>
# Clone your copy of the nextflow project (replace <usr_name>).
git clone https://gitbio.ens-lyon.fr/<usr_name>/nextflow.git
# Clone the tiny test dataset inside the project's data/ directory,
# then go back to the project root.
cd nextflow/data
git clone https://gitbio.ens-lyon.fr/LBMC/hub/tiny_dataset.git
cd ..
# Launch the pipeline with the psmn profile, overriding the fastq glob and
# the two fasta parameters read by the script.
./nextflow run src/RNAseq_cec.nf \
        -profile psmn \
        --fastq "data/*.fastq" \
        --cds_fasta "data/c_elegans.PRJNA13758.WS278.all_transcripts.fa" \
        --genomic_fasta "data/c_elegans.PRJNA13758.WS278.genomic.fa"

src/install_nextflow.sh
  screen -S rnaseq # to create the rnaseq screen
  src/RNAseq_script.sh # to launch the script
  screen -r rnaseq #to reattach the screen