Skip to content

Commit 85fd780

Browse files
committed
Update build configuration schema (JSON).
1 parent 74bc441 commit 85fd780

File tree

2 files changed

+80
-121
lines changed

2 files changed

+80
-121
lines changed
Lines changed: 80 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,80 @@
1+
{
2+
"$schema": "buildConfigurationSchema.json",
3+
"title": "MUSIAL v2.4 build configuration",
4+
"description": "JSON schema to validate and document the MUSIAL build task parameters.",
5+
"type": "object",
6+
"properties": {
7+
"minimalCoverage": {
8+
"description": "The minimal depth of coverage wrt. reads of a variant to be accepted.",
9+
"type": "integer",
10+
"minimum": 0
11+
},
12+
"minimalFrequency": {
13+
"description": "The minimal frequency wrt. reads supporting a nucleotide variant call for a variant to be accepted.",
14+
"type": "number",
15+
"minimum": 0.0,
16+
"maximum": 1.0
17+
},
18+
"storeFiltered": {
19+
"description": "If set to true, calls that are filtered by coverage and frequency restrictions are retained as ambiguous variants (N).",
20+
"type": "boolean"
21+
},
22+
"skipSnpEff": {
23+
"description": "If set to true, SnpEff analysis will be skipped.",
24+
"type": "boolean"
25+
},
26+
"skipProteoformInference": {
27+
"description": "If set to true, proteoform inference will be skipped.",
28+
"type": "boolean"
29+
},
30+
"excludedPositions": {
31+
"description": "Path to a BED file (no header row, rows starting with # are ignored); Only obligatory columns one (chrom), two (start) and three (end) are considered. Specification of positions to be excluded from the analysis.",
32+
"type": "string",
33+
"pattern": "^.+.bed|.+.tsv|.+.csv$"
34+
},
35+
"excludedVariants": {
36+
"description": "Path to a .tsv file (no header row, rows starting with # are ignored); The file is expected to contain four columns (chrom, pos, ref, alt). Specification of variants to be excluded from the analysis",
37+
"type": "string",
38+
"pattern": "^.+.tsv|.+.csv$"
39+
},
40+
"reference": {
41+
"description": "Path to a FASTA file. Content will be used as the reference sequences.",
42+
"type": "string",
43+
"pattern": "^.+.fasta|.+.fas|.+.fa$"
44+
},
45+
"annotation": {
46+
"description": "Path to a GFF3 file; Content will be used as reference sequences feature annotation.",
47+
"type": "string",
48+
"pattern": "^.+.gff3|.+.gff$"
49+
},
50+
"output": {
51+
"description": "Path to directory or file to write the output file (storage) to.",
52+
"type": "string",
53+
"pattern": "^.+$"
54+
},
55+
"vcfInput": {
56+
"description": "List of files or directories specifying the samples (VCF files) to be analyzed.",
57+
"type": "array",
58+
"uniqueItems": true,
59+
"minItems": 1,
60+
"items": {
61+
"type": "string"
62+
}
63+
},
64+
"vcfMeta": {
65+
"description": "Path to a .tsv or .csv file specifying sample annotations. The file is expected to contain a header row with the first column representing the sample names (matching to the `variantCalls` genotype fields). The remaining columns can be arbitrary.",
66+
"type": "string",
67+
"pattern": "^.+.tsv|.+.csv$"
68+
},
69+
"features": {
70+
"description": "Path to a .tsv or .csv file (no header row, rows starting with # are ignored) specifying the set of reference features to analyze. The file is expected to contain two columns representing the attribute key and value to match the feature from, i.e., key/value pairs of any property in the last column of the provided GFF3 file. An optional third column can be used to specify additional attributes in the notation KEY=VALUE;...",
71+
"type": "string",
72+
"pattern": "^.+.tsv|.+.csv$"
73+
}
74+
},
75+
"required": [
76+
"output",
77+
"vcfInput"
78+
],
79+
"additionalProperties": false
80+
}

src/main/resources/musial_build_configuration.schema.json

Lines changed: 0 additions & 121 deletions
This file was deleted.

0 commit comments

Comments
 (0)