diff --git a/.gitignore b/.gitignore
index d88c0bcbf31e519a61c630f9b4a0884cbfea6b38..b03679d775baf376284abd55a42e56689723de5d 100644
--- a/.gitignore
+++ b/.gitignore
@@ -9,3 +9,10 @@ src/mergekmer
 .Rhistory
 .Rprofile
 .kmer-diff.Rproj
+.Rbuildignore
+doc/2023_09_18_presentation.html
+doc/2023_09_18_presentation_files/
+doc/presentation_files/
+fail.txt
+kmer-diff.Rproj
+src/plot_counts.Rmd
diff --git a/src/modules/sample_reads.nf b/src/modules/sample_reads.nf
index 6bce0b3ba53e13c562448f1ab67493ec114ed9a4..e10d4ec25107c9302dd59852a5e3d07d1a0d8423 100644
--- a/src/modules/sample_reads.nf
+++ b/src/modules/sample_reads.nf
@@ -120,10 +120,25 @@ process SAMPLE_READS {
         error "SEQTK/SAMPLE must have a sample_size value included"
     }
     """
-    if [\$(cat $sample_size | tr -d '\\n') -eq \$(cat $read_number | tr -d '\\n')]; then
+    # Requested sample size (used below as a line count by head -n) and the
+    # current count, each read from a one-value file with the newline stripped.
+    SAMPLE_SIZE=\$(tr -d '\\n' < $sample_size)
+    CURRENT_READ_NUMBER=\$(tr -d '\\n' < $read_number)
+
+    if [ "\$SAMPLE_SIZE" -eq "\$CURRENT_READ_NUMBER" ]; then
+        # The input already has the requested size: link it instead of copying.
         ln -s ${reads} sample_${reads}
+        READ_NUMBER=\$CURRENT_READ_NUMBER
     else
-        zcat ${reads} | head -n \$(cat $sample_size | tr -d '\\n') | gzip -c > sample_${reads}
+        zcat ${reads} | head -n "\$SAMPLE_SIZE" | gzip -c > sample_${reads}
+        READ_NUMBER=\$(zcat sample_${reads} | wc -l)
+    fi
+
+    # Fail the task when the output does not hold the requested number of
+    # lines, e.g. because the input was shorter than the sample size.
+    if [ "\$SAMPLE_SIZE" -ne "\$READ_NUMBER" ]; then
+        echo "sample_${reads}: expected \$SAMPLE_SIZE lines, got \$READ_NUMBER" >&2
+        exit 1
     fi
 
     cat <<-END_VERSIONS > versions.yml
diff --git a/src/modules/split.nf b/src/modules/split.nf
index a6cf5fe04c30b347a2f7a45b7c89d81a8c40825e..9a8b72ff3893b04bef17087494d10f56f84dbb63 100644
--- a/src/modules/split.nf
+++ b/src/modules/split.nf
@@ -16,6 +16,20 @@ process SPLIT {
     """
     zcat ${fastq} | split -l 4000000 - ${fastq.simpleName}_
 
+    # Sanity-check the chunks: split fills every chunk except the last with
+    # exactly 4000000 lines, so a chunk of any other size that is followed by
+    # another chunk means the split went wrong.
+    short_chunk_seen=0
+    for chunk in ${fastq.simpleName}_*; do
+        if [ "\$short_chunk_seen" -ne 0 ]; then
+            echo "\$chunk follows a chunk that does not hold 4000000 lines" >&2
+            exit 1
+        fi
+        if [ "\$(wc -l < "\$chunk")" -ne 4000000 ]; then
+            short_chunk_seen=1
+        fi
+    done
+
     ls -l ${fastq.simpleName}_* | \\
     awk '{system("gzip -c "\$9" > "\$9".fastq.gz && rm "\$9)}'
 