From e54720be08d3a4998a392e196c665d67a9347c9d Mon Sep 17 00:00:00 2001 From: Laurent Modolo <laurent.modolo@ens-lyon.fr> Date: Wed, 5 May 2021 14:36:41 +0200 Subject: [PATCH] alntools: update transcript lengths computation --- src/nf_modules/alntools/main.nf | 15 +++++++-------- 1 file changed, 7 insertions(+), 8 deletions(-) diff --git a/src/nf_modules/alntools/main.nf b/src/nf_modules/alntools/main.nf index 8813a050..ef1e879e 100644 --- a/src/nf_modules/alntools/main.nf +++ b/src/nf_modules/alntools/main.nf @@ -21,17 +21,16 @@ process bam2ec { script: """ -awk -F"\t" ' -\$3=="exon" - { - ID=substr(\$9, length(\$9)-16, 15); - L[ID]+=\$5-\$4+1 +awk -F"[\t;]" ' +\$3=="exon" { + ID=gensub(/transcript_id \"(.*)\"/, "\\1", "g", \$11); + LEN[ID]+=\$5-\$4+1; } END{ - for(i in L) - {print i"\t"L[i]} + for(i in LEN) + {print i"\t"LEN[i]} } -' ${gtf} ${gtf.simpleName}_transcripts_lengths.tsv +' ${gtf} > ${gtf.simpleName}_transcripts_lengths.tsv alntools bam2ec ${params.bam2sec} -t ${gtf.simpleName}_transcripts_lengths.tsv -c 8 ${bam} ${bam.simpleName}.bin """ } \ No newline at end of file -- GitLab