Skip to content

Commit 2acafd1

Browse files
DriesSchaumontgithub-actions[bot]
authored andcommitted
deploy: e36c057
1 parent e36c057 commit 2acafd1

File tree

923 files changed

+669070
-1
lines changed

Some content is hidden

Large Commits have some content hidden by default. Use the searchbox below for content that may be hidden.

923 files changed

+669070
-1
lines changed

.gitignore

Lines changed: 0 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -29,7 +29,6 @@ out/
2929
# viash related
3030
.viash_log*
3131
log.txt
32-
/target/
3332
check_results/
3433
out/
3534
output*
Lines changed: 38 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,38 @@
1+
# Inputs
2+
mode: # please fill in - example: "wta"
3+
id: # please fill in - example: "foo"
4+
input: # please fill in - example: ["input.fastq.gz"]
5+
reference: # please fill in - example: ["reference_genome.tar.gz|reference.fasta"]
6+
# transcriptome_annotation: "transcriptome.gtf"
7+
# abseq_reference: ["abseq_reference.fasta"]
8+
# supplemental_reference: ["supplemental_reference.fasta"]
9+
sample_prefix: "sample"
10+
11+
# Outputs
12+
# output_raw: "$id.$key.output_raw.output_raw"
13+
# output_h5mu: "$id.$key.output_h5mu.h5mu"
14+
15+
# Putative cell calling settings
16+
# putative_cell_call: "mRNA"
17+
# exact_cell_count: 10000
18+
disable_putative_calling: false
19+
20+
# Subsample arguments
21+
# subsample: 0.01
22+
# subsample_seed: 3445
23+
24+
# Multiplex arguments
25+
# sample_tags_version: "human"
26+
# tag_names: ["4-mySample", "9-myOtherSample", "6-alsoThisSample"]
27+
28+
# VDJ arguments
29+
# vdj_version: "human"
30+
31+
# CWL-runner arguments
32+
parallel: true
33+
timestamps: false
34+
dryrun: false
35+
36+
# Nextflow input-output arguments
37+
publish_dir: # please fill in - example: "output/"
38+
# param_list: "my_params.yaml"
Lines changed: 252 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,252 @@
1+
{
2+
"$schema": "http://json-schema.org/draft-07/schema",
3+
"title": "bd_rhapsody",
4+
"description": "A wrapper for the BD Rhapsody Analysis CWL v1.10.1 pipeline.\n\nThis pipeline can be used for a targeted analysis (with `--mode targeted`) or for a whole transcriptome analysis (with `--mode wta`).\n\n* If mode is `\"targeted\"`, then either the `--reference` or `--abseq_reference` parameters must be defined.\n* If mode is `\"wta\"`, then `--reference` and `--transcriptome_annotation` must be defined, `--abseq_reference` and `--supplemental_reference` is optional.\n\nThe reference_genome and transcriptome_annotation files can be generated with the make_reference pipeline.\nAlternatively, BD also provides standard references which can be downloaded from these locations:\n\n - Human: http://bd-rhapsody-public.s3-website-us-east-1.amazonaws.com/Rhapsody-WTA/GRCh38-PhiX-gencodev29/\n - Mouse: http://bd-rhapsody-public.s3-website-us-east-1.amazonaws.com/Rhapsody-WTA/GRCm38-PhiX-gencodevM19/\n",
5+
"type": "object",
6+
"definitions": {
7+
"inputs" : {
8+
"title": "Inputs",
9+
"type": "object",
10+
"description": "No description",
11+
"properties": {
12+
13+
"mode": {
14+
"type": "string",
15+
"description": "Type: `string`, required, example: `wta`, choices: ``wta`, `targeted``. Whether to run a whole transcriptome analysis (WTA) or a targeted analysis",
16+
"help_text": "Type: `string`, required, example: `wta`, choices: ``wta`, `targeted``. Whether to run a whole transcriptome analysis (WTA) or a targeted analysis.",
17+
"enum": ["wta", "targeted"]
18+
19+
},
20+
21+
"id": {
22+
"type": "string",
23+
"description": "Type: `string`, required, example: `foo`. ID of the sample",
24+
"help_text": "Type: `string`, required, example: `foo`. ID of the sample."
25+
},
26+
27+
"input": {
28+
"type": "string",
29+
"description": "Type: List of `file`, required, example: `input.fastq.gz`, multiple_sep: `\";\"`. Path to your read files in the FASTQ",
30+
"help_text": "Type: List of `file`, required, example: `input.fastq.gz`, multiple_sep: `\";\"`. Path to your read files in the FASTQ.GZ format. You may specify as many R1/R2 read pairs as you want."
31+
},
32+
33+
"reference": {
34+
"type": "string",
35+
"description": "Type: List of `file`, required, example: `reference_genome.tar.gz|reference.fasta`, multiple_sep: `\";\"`. Refence to map to",
36+
"help_text": "Type: List of `file`, required, example: `reference_genome.tar.gz|reference.fasta`, multiple_sep: `\";\"`. Refence to map to. For `--mode wta`, this is the path to STAR index as a tar.gz file. For `--mode targeted`, this is the path to mRNA reference file for pre-designed, supplemental, or custom panel, in FASTA format"
37+
},
38+
39+
"transcriptome_annotation": {
40+
"type": "string",
41+
"description": "Type: `file`, example: `transcriptome.gtf`. Path to GTF annotation file (only for `--mode wta`)",
42+
"help_text": "Type: `file`, example: `transcriptome.gtf`. Path to GTF annotation file (only for `--mode wta`)."
43+
},
44+
45+
"abseq_reference": {
46+
"type": "string",
47+
"description": "Type: List of `file`, example: `abseq_reference.fasta`, multiple_sep: `\";\"`. Path to the AbSeq reference file in FASTA format",
48+
"help_text": "Type: List of `file`, example: `abseq_reference.fasta`, multiple_sep: `\";\"`. Path to the AbSeq reference file in FASTA format. Only needed if BD AbSeq Ab-Oligos are used."
49+
},
50+
51+
"supplemental_reference": {
52+
"type": "string",
53+
"description": "Type: List of `file`, example: `supplemental_reference.fasta`, multiple_sep: `\";\"`. Path to the supplemental reference file in FASTA format",
54+
"help_text": "Type: List of `file`, example: `supplemental_reference.fasta`, multiple_sep: `\";\"`. Path to the supplemental reference file in FASTA format. Only needed if there are additional transgene sequences used in the experiment (only for `--mode wta`)."
55+
},
56+
57+
"sample_prefix": {
58+
"type": "string",
59+
"description": "Type: `string`, default: `sample`. Specify a run name to use as the output file base name",
60+
"help_text": "Type: `string`, default: `sample`. Specify a run name to use as the output file base name. Use only letters, numbers, or hyphens. Do not use special characters or spaces.",
61+
"default": "sample"
62+
}
63+
64+
}
65+
},
66+
"outputs" : {
67+
"title": "Outputs",
68+
"type": "object",
69+
"description": "No description",
70+
"properties": {
71+
72+
"output_raw": {
73+
"type": "string",
74+
"description": "Type: `file`, required, default: `$id.$key.output_raw.output_raw`, example: `output_dir/`. The BD Rhapsody output folder as it comes out of the BD Rhapsody pipeline",
75+
"help_text": "Type: `file`, required, default: `$id.$key.output_raw.output_raw`, example: `output_dir/`. The BD Rhapsody output folder as it comes out of the BD Rhapsody pipeline",
76+
"default": "$id.$key.output_raw.output_raw"
77+
},
78+
79+
"output_h5mu": {
80+
"type": "string",
81+
"description": "Type: `file`, required, default: `$id.$key.output_h5mu.h5mu`, example: `output.h5mu`. The converted h5mu file",
82+
"help_text": "Type: `file`, required, default: `$id.$key.output_h5mu.h5mu`, example: `output.h5mu`. The converted h5mu file.",
83+
"default": "$id.$key.output_h5mu.h5mu"
84+
}
85+
86+
}
87+
},
88+
"putative cell calling settings" : {
89+
"title": "Putative cell calling settings",
90+
"type": "object",
91+
"description": "No description",
92+
"properties": {
93+
94+
"putative_cell_call": {
95+
"type": "string",
96+
"description": "Type: `string`, example: `mRNA`, choices: ``mRNA`, `AbSeq_Experimental``. Specify the dataset to be used for putative cell calling",
97+
"help_text": "Type: `string`, example: `mRNA`, choices: ``mRNA`, `AbSeq_Experimental``. Specify the dataset to be used for putative cell calling. For putative cell calling using an AbSeq dataset, please provide an AbSeq_Reference fasta file above.",
98+
"enum": ["mRNA", "AbSeq_Experimental"]
99+
100+
},
101+
102+
"exact_cell_count": {
103+
"type": "integer",
104+
"description": "Type: `integer`, example: `10000`. Exact cell count - Set a specific number (\u003e=1) of cells as putative, based on those with the highest error-corrected read count",
105+
"help_text": "Type: `integer`, example: `10000`. Exact cell count - Set a specific number (\u003e=1) of cells as putative, based on those with the highest error-corrected read count"
106+
},
107+
108+
"disable_putative_calling": {
109+
"type": "boolean",
110+
"description": "Type: `boolean_true`, default: `false`. Disable Refined Putative Cell Calling - Determine putative cells using only the basic algorithm (minimum second derivative along the cumulative reads curve)",
111+
"help_text": "Type: `boolean_true`, default: `false`. Disable Refined Putative Cell Calling - Determine putative cells using only the basic algorithm (minimum second derivative along the cumulative reads curve). The refined algorithm attempts to remove false positives and recover false negatives, but may not be ideal for certain complex mixtures of cell types. Does not apply if Exact Cell Count is set.",
112+
"default": "False"
113+
}
114+
115+
}
116+
},
117+
"subsample arguments" : {
118+
"title": "Subsample arguments",
119+
"type": "object",
120+
"description": "No description",
121+
"properties": {
122+
123+
"subsample": {
124+
"type": "number",
125+
"description": "Type: `double`, example: `0.01`. A number \u003e1 or fraction (0 \u003c n \u003c 1) to indicate the number or percentage of reads to subsample",
126+
"help_text": "Type: `double`, example: `0.01`. A number \u003e1 or fraction (0 \u003c n \u003c 1) to indicate the number or percentage of reads to subsample."
127+
},
128+
129+
"subsample_seed": {
130+
"type": "integer",
131+
"description": "Type: `integer`, example: `3445`. A seed for replicating a previous subsampled run",
132+
"help_text": "Type: `integer`, example: `3445`. A seed for replicating a previous subsampled run."
133+
}
134+
135+
}
136+
},
137+
"multiplex arguments" : {
138+
"title": "Multiplex arguments",
139+
"type": "object",
140+
"description": "No description",
141+
"properties": {
142+
143+
"sample_tags_version": {
144+
"type": "string",
145+
"description": "Type: `string`, example: `human`, choices: ``human`, `hs`, `mouse`, `mm``. Specify if multiplexed run",
146+
"help_text": "Type: `string`, example: `human`, choices: ``human`, `hs`, `mouse`, `mm``. Specify if multiplexed run.",
147+
"enum": ["human", "hs", "mouse", "mm"]
148+
149+
},
150+
151+
"tag_names": {
152+
"type": "string",
153+
"description": "Type: List of `string`, example: `4-mySample:9-myOtherSample:6-alsoThisSample`, multiple_sep: `\":\"`. Tag_Names (optional) - Specify the tag number followed by \u0027-\u0027 and the desired sample name to appear in Sample_Tag_Metrics",
154+
"help_text": "Type: List of `string`, example: `4-mySample:9-myOtherSample:6-alsoThisSample`, multiple_sep: `\":\"`. Tag_Names (optional) - Specify the tag number followed by \u0027-\u0027 and the desired sample name to appear in Sample_Tag_Metrics.csv.\nDo not use the special characters: \u0026, (), [], {}, \u003c\u003e, ?, |\n"
155+
}
156+
157+
}
158+
},
159+
"vdj arguments" : {
160+
"title": "VDJ arguments",
161+
"type": "object",
162+
"description": "No description",
163+
"properties": {
164+
165+
"vdj_version": {
166+
"type": "string",
167+
"description": "Type: `string`, example: `human`, choices: ``human`, `mouse`, `humanBCR`, `humanBCR`, `humanTCR`, `mouseBCR``. Specify if VDJ run",
168+
"help_text": "Type: `string`, example: `human`, choices: ``human`, `mouse`, `humanBCR`, `humanBCR`, `humanTCR`, `mouseBCR``. Specify if VDJ run.",
169+
"enum": ["human", "mouse", "humanBCR", "humanBCR", "humanTCR", "mouseBCR"]
170+
171+
}
172+
173+
}
174+
},
175+
"cwl-runner arguments" : {
176+
"title": "CWL-runner arguments",
177+
"type": "object",
178+
"description": "No description",
179+
"properties": {
180+
181+
"parallel": {
182+
"type": "boolean",
183+
"description": "Type: `boolean`, default: `true`. Run jobs in parallel",
184+
"help_text": "Type: `boolean`, default: `true`. Run jobs in parallel.",
185+
"default": "True"
186+
},
187+
188+
"timestamps": {
189+
"type": "boolean",
190+
"description": "Type: `boolean_true`, default: `false`. Add timestamps to the errors, warnings, and notifications",
191+
"help_text": "Type: `boolean_true`, default: `false`. Add timestamps to the errors, warnings, and notifications.",
192+
"default": "False"
193+
},
194+
195+
"dryrun": {
196+
"type": "boolean",
197+
"description": "Type: `boolean_true`, default: `false`. If true, the output directory will only contain the CWL input files, but the pipeline itself will not be executed",
198+
"help_text": "Type: `boolean_true`, default: `false`. If true, the output directory will only contain the CWL input files, but the pipeline itself will not be executed.",
199+
"default": "False"
200+
}
201+
202+
}
203+
},
204+
"nextflow input-output arguments" : {
205+
"title": "Nextflow input-output arguments",
206+
"type": "object",
207+
"description": "Input/output parameters for Nextflow itself. Please note that both publishDir and publish_dir are supported but at least one has to be configured.",
208+
"properties": {
209+
210+
"publish_dir": {
211+
"type": "string",
212+
"description": "Type: `string`, required, example: `output/`. Path to an output directory",
213+
"help_text": "Type: `string`, required, example: `output/`. Path to an output directory."
214+
},
215+
216+
"param_list": {
217+
"type": "string",
218+
"description": "Type: `string`, example: `my_params.yaml`. Allows inputting multiple parameter sets to initialise a Nextflow channel",
219+
"help_text": "Type: `string`, example: `my_params.yaml`. Allows inputting multiple parameter sets to initialise a Nextflow channel. A `param_list` can either be a list of maps, a csv file, a json file, a yaml file, or simply a yaml blob.\n\n* A list of maps (as-is) where the keys of each map corresponds to the arguments of the pipeline. Example: in a `nextflow.config` file: `param_list: [ [\u0027id\u0027: \u0027foo\u0027, \u0027input\u0027: \u0027foo.txt\u0027], [\u0027id\u0027: \u0027bar\u0027, \u0027input\u0027: \u0027bar.txt\u0027] ]`.\n* A csv file should have column names which correspond to the different arguments of this pipeline. Example: `--param_list data.csv` with columns `id,input`.\n* A json or a yaml file should be a list of maps, each of which has keys corresponding to the arguments of the pipeline. Example: `--param_list data.json` with contents `[ {\u0027id\u0027: \u0027foo\u0027, \u0027input\u0027: \u0027foo.txt\u0027}, {\u0027id\u0027: \u0027bar\u0027, \u0027input\u0027: \u0027bar.txt\u0027} ]`.\n* A yaml blob can also be passed directly as a string. Example: `--param_list \"[ {\u0027id\u0027: \u0027foo\u0027, \u0027input\u0027: \u0027foo.txt\u0027}, {\u0027id\u0027: \u0027bar\u0027, \u0027input\u0027: \u0027bar.txt\u0027} ]\"`.\n\nWhen passing a csv, json or yaml file, relative path names are relativized to the location of the parameter file. No relativation is performed when `param_list` is a list of maps (as-is) or a yaml blob.",
220+
"hidden": true
221+
}
222+
223+
}
224+
}
225+
},
226+
"allOf": [
227+
{
228+
"$ref": "#/definitions/inputs"
229+
},
230+
{
231+
"$ref": "#/definitions/outputs"
232+
},
233+
{
234+
"$ref": "#/definitions/putative cell calling settings"
235+
},
236+
{
237+
"$ref": "#/definitions/subsample arguments"
238+
},
239+
{
240+
"$ref": "#/definitions/multiplex arguments"
241+
},
242+
{
243+
"$ref": "#/definitions/vdj arguments"
244+
},
245+
{
246+
"$ref": "#/definitions/cwl-runner arguments"
247+
},
248+
{
249+
"$ref": "#/definitions/nextflow input-output arguments"
250+
}
251+
]
252+
}
Lines changed: 21 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,21 @@
1+
# Inputs
2+
id: # please fill in - example: "foo"
3+
input: # please fill in - example: ["sample_S1_L001_R1_001.fastq.gz", "sample_S1_L001_R2_001.fastq.gz"]
4+
reference: # please fill in - example: "reference.tar.gz"
5+
6+
# Outputs
7+
# output_raw: "$id.$key.output_raw.output_raw"
8+
# output_h5mu: "$id.$key.output_h5mu.h5mu"
9+
uns_metrics: "metrics_summary"
10+
output_type: "raw"
11+
12+
# Cell Ranger arguments
13+
# expect_cells: 3000
14+
chemistry: "auto"
15+
secondary_analysis: false
16+
generate_bam: true
17+
include_introns: true
18+
19+
# Nextflow input-output arguments
20+
publish_dir: # please fill in - example: "output/"
21+
# param_list: "my_params.yaml"

0 commit comments

Comments
 (0)