Skip to content

Commit 0561c64

Browse files
committed
add vv raw reads stub, fix configs
1 parent ead77cb commit 0561c64

File tree

3 files changed

+22
-57
lines changed

3 files changed

+22
-57
lines changed

RNAseq/Workflow_Documentation/NF_RCP/workflow_code/conf/by_docker_image.config

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -60,7 +60,7 @@ process {
6060
container = "quay.io/biocontainers/rsem:1.3.3--pl526ha52163a_0"
6161
}
6262

63-
withName: 'GET_ACCESSIONS|FETCH_ISA|ISA_TO_RUNSHEET|RUNSHEET_FROM_ISA|GENERATE_MD5SUMS|SOFTWARE_VERSIONS|UPDATE_ISA_TABLES|PARSE_QC_METRICS|REMOVE_RRNA_FEATURECOUNTS|MD5SUM' {
63+
withName: 'GET_ACCESSIONS|FETCH_ISA|ISA_TO_RUNSHEET|RUNSHEET_FROM_ISA|GENERATE_MD5SUMS|SOFTWARE_VERSIONS|UPDATE_ISA_TABLES|PARSE_QC_METRICS|REMOVE_RRNA_FEATURECOUNTS|MD5SUM' {
6464
container = "quay.io/nasa_genelab/dp_tools:1.3.5"
6565
}
6666

RNAseq/Workflow_Documentation/NF_RCP/workflow_code/conf/slurm.config

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -87,7 +87,7 @@ process {
8787
cpus = { 12 * task.attempt }
8888
memory = { 72.GB * task.attempt }
8989
}
90-
withName:DESEQ2_DGE {
90+
withName:DGE_DESEQ2 {
9191
// To do: Optimize both settings, large dataset wald
9292
cpus = { 4 * task.attempt }
9393
memory = { 16.GB * task.attempt }

RNAseq/Workflow_Documentation/NF_RCP/workflow_code/modules/vv.nf

Lines changed: 20 additions & 55 deletions
Original file line numberDiff line numberDiff line change
@@ -1,80 +1,45 @@
1-
/* VV check processes
2-
* These processes intentional deviate from Nextflow isolation to ensure QC reports
3-
* are based on files in publish directory and not work directories.
4-
*/
5-
6-
// NOTE: first VV step also creates initial VV file that is shared across all vv steps
7-
// process VV_RAW_READS {
8-
// label 'VV'
9-
// // Log publishing
10-
// publishDir "${ publishdir }",
11-
// pattern: "test.txt",
12-
// mode: params.publish_dir_mode
13-
14-
// input:
15-
// val(publishdir)
16-
// val(meta)
17-
// path("Metadata/*_runsheet.csv") // Runsheet
18-
// path("00-RawData/Fastq/*") // Raw reads
19-
// path("00-RawData/FastQC_Reports/*") // Raw FastQC reports
20-
// path("00-RawData/FastQC_Reports/*") // Raw MultiQC report
21-
// path(dp_tools__NF_RCP)
22-
23-
// output:
24-
// path("test.txt"), emit: test
25-
26-
// script:
27-
// """
28-
// echo "Meta: ${meta}" > test.txt
29-
// """
30-
// }
311
process VV_RAW_READS {
32-
// Log publishing
2+
// Publish VV log
333
publishDir "${ publishdir }",
344
pattern: "VV_log.tsv" ,
355
mode: params.publish_dir_mode,
366
saveAs: { "VV_Logs/VV_log_${ task.process.replace(":","-") }${ params.assay_suffix }.tsv" }
37-
// V&V'ed data publishing
7+
// Publish VVed data
388
publishDir "${ publishdir }",
399
pattern: '00-RawData/**',
4010
mode: params.publish_dir_mode
4111

4212
label 'VV'
4313

4414
input:
15+
path(dp_tools__NF_RCP)
4516
val(publishdir)
4617
val(meta)
47-
path("VV_INPUT/Metadata/*") // Runsheet
48-
path("VV_INPUT/00-RawData/Fastq/*") // Raw reads
49-
path("VV_INPUT/00-RawData/FastQC_Reports/*") // Raw FastQC reports
50-
path("VV_INPUT/00-RawData/FastQC_Reports/*") // Unzipped Raw MultiQC report
51-
path("VV_INPUT/00-RawData/FastQC_Reports/*") // Zipped Raw MultiQC report
52-
path(dp_tools__NF_RCP)
18+
path(runsheet) // Runsheet
19+
path("INPUT/raw_fastq/*") // Raw reads
20+
path("INPUT/raw_fastqc/*") // Raw FastQC reports
21+
path("INPUT/raw_multiqc/*") // Unzipped Raw MultiQC report
5322

5423
output:
55-
path("Metadata/*_runsheet.csv"), emit: VVed_runsheet
5624
path("00-RawData/Fastq"), emit: VVed_raw_reads
5725
path("00-RawData/FastQC_Reports/*{_fastqc.html,_fastqc.zip}"), emit: VVed_raw_fastqc
58-
path("00-RawData/FastQC_Reports/raw_multiqc${params.assay_suffix}_report"), emit: VVed_raw_unzipped_multiqc_report
59-
path("00-RawData/FastQC_Reports/raw_multiqc${params.assay_suffix}_report.zip"), emit: VVed_raw_zipped_multiqc_report
26+
path("00-RawData/FastQC_Reports/raw_multiqc${params.assay_suffix}_report"), emit: VVed_raw_unzipped_multiqc_report
27+
//path("00-RawData/FastQC_Reports/raw_multiqc${params.assay_suffix}_report.zip"), emit: VVed_raw_zipped_multiqc_report
6028
path("VV_log.tsv"), optional: params.skipVV, emit: log
6129

6230
script:
6331
"""
64-
# move from VV_INPUT to task directory
65-
# This allows detection as output files for publishing
66-
mv VV_INPUT/* . || true
67-
68-
# Run V&V unless user requests to skip V&V
69-
if ${ !params.skipVV } ; then
70-
dpt validation run ${dp_tools__NF_RCP} . Metadata/*_runsheet.csv \\
71-
--data-asset-key-sets \\
72-
${ meta.paired_end ? "'demuliplexed paired end raw data,qc reports for paired end raw data'" : "'demuliplexed single end raw data,qc reports for single end raw data'"} \\
73-
--run-components \\
74-
'Metadata,Raw Reads,Raw Reads By Sample' \\
75-
--max-flag-code ${ params.max_flag_code } \\
76-
--output VV_log.tsv
77-
fi
32+
mv INPUT/* . || true
33+
vv.py --assay-type rnaseq \
34+
--assay-suffix ${params.assay_suffix} \
35+
--runsheet-path ${runsheet} \
36+
--outdir ${publishdir} \
37+
--paired-end ${meta.paired_end} \
38+
--mode microbes \
39+
--raw-fastq raw_fastq/ \
40+
--raw-fastqc raw_fastqc/ \
41+
--raw-multiqc raw_multiqc/ \
42+
--run-components raw_reads
7843
"""
7944
}
8045

0 commit comments

Comments
 (0)