-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathfastp_fastqc_single-end.nf
77 lines (57 loc) · 1.64 KB
/
fastp_fastqc_single-end.nf
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
#!/usr/bin/env nextflow
/*
* Defines pipeline parameters in order to specify the refence genomes
* and read pairs by using the command line options
*/
params.reads = "$baseDir/data/fastq/*fastq.gz"
Channel
.fromPath( params.reads )
.ifEmpty { error "Cannot find any reads matching: ${params.reads}" }
.map { file -> tuple(file.simpleName, file) }
.into { reads; fastqc_reads }
/*
* QC raw reads
*/
process preFastqc {
publishDir "$baseDir/results/fastqc/pre/"
input:
set val(dataset_id), file(r1) from fastqc_reads
output:
file "*_fastqc.{zip,html}" into raw_fastqc_results
module 'singularity'
script:
"""
singularity run -B /zfs,/scratch2 ~/singularity_containers/fastqc.simg -q ${r1}
"""
}
/*
* Clean the reads
*/
process cleanReads {
publishDir "$baseDir/data/fastq/trimmed/"
input:
set val(dataset_id), file(forward) from reads
output:
set dataset_id, file("${dataset_id}.TRIMMED.fq.gz") into trimmed_reads
module 'singularity'
clusterOptions = '-l select=1:ncpus=4:mem=5gb,walltime=08:00:00'
script:
"""
singularity run -B /zfs,/scratch2 ~/singularity_containers/fastp.simg --length_required=80 --thread=4 --in1=${forward} --out1=${dataset_id}.TRIMMED.fq.gz
"""
}
/*
* QC trimmed reads
*/
process postFastqc {
publishDir "results/fastqc/post/"
input:
set val(dataset_id), file(r1) from trimmed_reads
output:
file "*_fastqc.{zip,html}" into trimmed_fastqc_results
module 'singularity'
script:
"""
singularity run -B /zfs,/scratch2 ~/singularity_containers/fastqc.simg -q ${r1}
"""
}