@@ -128,7 +128,7 @@ Data Objects:
128
128
- data_object_type : Metagenome Raw Reads
129
129
description : Metagenome Raw Reads for {id}
130
130
name : Raw sequencer read data
131
- import_suffix : .[A-Z ]+-[A-Z]+ .fastq.gz
131
+ import_suffix : \.[ACGT ]+-[ACGT]+\ .fastq\ .gz$
132
132
nmdc_suffix : .fastq.gz
133
133
input_to : [nmdc:ReadQcAnalysis]
134
134
output_of : nmdc:NucleotideSequencing
@@ -137,7 +137,7 @@ Data Objects:
137
137
- data_object_type : Annotation Amino Acid FASTA
138
138
description : FASTA Amino Acid File for {id}
139
139
name : FASTA amino acid file for annotated proteins
140
- import_suffix : _proteins.faa
140
+ import_suffix : " ^(?!.*_(cds|genemark|prodigal) _proteins\\ .faa$).*proteins \\ .faa$ "
141
141
nmdc_suffix : _proteins.faa
142
142
input_to : []
143
143
output_of : nmdc:MetatranscriptomeAnnotation
@@ -146,7 +146,7 @@ Data Objects:
146
146
- data_object_type : Contig Mapping File
147
147
description : Contig mapping file for {id}
148
148
name : Contig mappings between old and new contig names
149
- import_suffix : _contig_names_mapping.tsv
149
+ import_suffix : " _contig_names_mapping\\ .tsv$ "
150
150
nmdc_suffix : _contig_names_mapping.tsv
151
151
input_to : []
152
152
output_of : nmdc:MetatranscriptomeAnnotation
@@ -155,7 +155,7 @@ Data Objects:
155
155
- data_object_type : Structural Annotation GFF
156
156
description : Structural Annotation for {id}
157
157
name : GFF3 format file with structural annotations
158
- import_suffix : _structural_annotation.gff
158
+ import_suffix : _structural_annotation\ .gff$
159
159
nmdc_suffix : _structural_annotation.gff
160
160
input_to : []
161
161
output_of : nmdc:MetatranscriptomeAnnotation
@@ -164,7 +164,7 @@ Data Objects:
164
164
- data_object_type : Functional Annotation GFF
165
165
description : Functional Annotation for {id}
166
166
name : GFF3 format file with functional annotations
167
- import_suffix : _functional_annotation.gff
167
+ import_suffix : _functional_annotation\ .gff$
168
168
nmdc_suffix : _functional_annotation.gff
169
169
input_to : [nmdc:MetatranscriptomeExpressionAnalysis]
170
170
output_of : nmdc:MetatranscriptomeAnnotation
@@ -173,7 +173,7 @@ Data Objects:
173
173
- data_object_type : Annotation KEGG Orthology
174
174
description : KEGG Orthology for {id}
175
175
name : Tab delimited file for KO annotation
176
- import_suffix : _ko.tsv
176
+ import_suffix : _ko\ .tsv$
177
177
nmdc_suffix : _ko.tsv
178
178
input_to : []
179
179
output_of : nmdc:MetatranscriptomeAnnotation
@@ -182,7 +182,7 @@ Data Objects:
182
182
- data_object_type : Annotation Enzyme Commission
183
183
description : EC Annotations for {id}
184
184
name : Tab delimited file for EC annotation
185
- import_suffix : _ec.tsv
185
+ import_suffix : _ec\ .tsv$
186
186
nmdc_suffix : _ec.tsv
187
187
input_to : []
188
188
output_of : nmdc:MetatranscriptomeAnnotation
@@ -191,15 +191,15 @@ Data Objects:
191
191
- data_object_type Scaffold Lineage tsv
192
192
description : Scaffold Lineage tsv for {id}
193
193
name : Phylogeny at the scaffold level
194
- import_suffix : _scaffold_lineage.tsv
194
+ import_suffix : _scaffold_lineage\ .tsv$
195
195
nmdc_suffix : _scaffold_lineage.tsv
196
196
input_to : []
197
197
output_of : nmdc:MetatranscriptomeAnnotation
198
198
multiple : false
199
199
- data_object_type : Clusters of Orthologous Groups (COG) Annotation GFF
200
200
description : COGs for {id}
201
201
name : GFF3 format file with COGs
202
- import_suffix : _cog.gff
202
+ import_suffix : _cog\ .gff$
203
203
nmdc_suffix : _cog.gff
204
204
input_to : []
205
205
output_of : nmdc:MetatranscriptomeAnnotation
@@ -208,7 +208,7 @@ Data Objects:
208
208
- data_object_type : Pfam Annotation GFF
209
209
description : Pfam Annotation for {id}
210
210
name : GFF3 format file with Pfam
211
- import_suffix : _pfam.gff
211
+ import_suffix : _pfam\ .gff$
212
212
nmdc_suffix : _pfam.gff
213
213
input_to : []
214
214
output_of : nmdc:MetatranscriptomeAnnotation
@@ -217,7 +217,7 @@ Data Objects:
217
217
- data_object_type : TIGRFam Annotation GFF
218
218
description : TIGRFam for {id}
219
219
name : GFF3 format file with TIGRfam
220
- import_suffix : _tigrfam.gff
220
+ import_suffix : _tigrfam\ .gff$
221
221
nmdc_suffix : _tigrfam.gff
222
222
input_to : []
223
223
output_of : nmdc:MetatranscriptomeAnnotation
@@ -226,7 +226,7 @@ Data Objects:
226
226
- data_object_type : SMART Annotation GFF
227
227
description : SMART Annotations for {id}
228
228
name : GFF3 format file with SMART
229
- import_suffix : _smart.gff
229
+ import_suffix : _smart\ .gff$
230
230
nmdc_suffix : _smart.gff
231
231
input_to : []
232
232
output_of : nmdc:MetatranscriptomeAnnotation
@@ -235,7 +235,7 @@ Data Objects:
235
235
- data_object_type : SUPERFam Annotation GFF
236
236
description : SUPERFam Annotations for {id}
237
237
name : GFF3 format file with SUPERFam
238
- import_suffix : _supfam.gff
238
+ import_suffix : _supfam\ .gff$
239
239
nmdc_suffix : _supfam.gff
240
240
input_to : []
241
241
output_of : nmdc:MetatranscriptomeAnnotation
@@ -244,7 +244,7 @@ Data Objects:
244
244
- data_object_type : CATH FunFams (Functional Families) Annotation GFF
245
245
description : CATH FunFams for {id}
246
246
name : GFF3 format file with CATH FunFams
247
- import_suffix : _cath_funfam.gff
247
+ import_suffix : _cath_funfam\ .gff$
248
248
nmdc_suffix : _cath_funfam.gff
249
249
input_to : []
250
250
output_of : nmdc:MetatranscriptomeAnnotation
@@ -253,7 +253,7 @@ Data Objects:
253
253
- data_object_type : CRT Annotation GFF
254
254
description : CRT Annotations for {id}
255
255
name : GFF3 format file with CRT
256
- import_suffix : _crt.gff
256
+ import_suffix : _crt\ .gff$
257
257
nmdc_suffix : _crt.gff
258
258
input_to : []
259
259
output_of : nmdc:MetatranscriptomeAnnotation
@@ -262,7 +262,7 @@ Data Objects:
262
262
- data_object_type : Genemark Annotation GFF
263
263
description : Genemark Annotations for {id}
264
264
name : GFF3 format file with Genemark
265
- import_suffix : _genemark.gff
265
+ import_suffix : _genemark\ .gff$
266
266
nmdc_suffix : _genemark.gff
267
267
input_to : []
268
268
output_of : nmdc:MetatranscriptomeAnnotation
@@ -271,7 +271,7 @@ Data Objects:
271
271
- data_object_type : Prodigal Annotation GFF
272
272
description : Prodigal Annotations {id}
273
273
name : GFF3 format file with Prodigal
274
- import_suffix : _prodigal.gff
274
+ import_suffix : _prodigal\ .gff$
275
275
nmdc_suffix : _prodigal.gff
276
276
input_to : []
277
277
output_of : nmdc:MetatranscriptomeAnnotation
@@ -280,7 +280,7 @@ Data Objects:
280
280
- data_object_type : TRNA Annotation GFF
281
281
description : TRNA Annotations {id}
282
282
name : GFF3 format file with TRNA
283
- import_suffix : _trna.gff
283
+ import_suffix : _trna\ .gff$
284
284
nmdc_suffix : _trna.gff
285
285
input_to : []
286
286
output_of : nmdc:MetatranscriptomeAnnotation
@@ -289,7 +289,7 @@ Data Objects:
289
289
- data_object_type : RFAM Annotation GFF
290
290
description : RFAM Annotations for {id}
291
291
name : GFF3 format file with RFAM
292
- import_suffix : _rfam.gff
292
+ import_suffix : _rfam\ .gff$
293
293
nmdc_suffix : _rfam.gff
294
294
input_to : []
295
295
output_of : nmdc:MetatranscriptomeAnnotation
@@ -298,7 +298,7 @@ Data Objects:
298
298
- data_object_type : KO_EC Annotation GFF
299
299
description : KO_EC Annotations for {id}
300
300
name : GFF3 format file with KO_EC
301
- import_suffix : _ko_ec.gff
301
+ import_suffix : _ko_ec\ .gff$
302
302
nmdc_suffix : _ko_ec.gff
303
303
input_to : []
304
304
output_of : nmdc:MetatranscriptomeAnnotation
@@ -307,7 +307,7 @@ Data Objects:
307
307
- data_object_type : Product Names
308
308
description : Product names for {id}
309
309
name : Product names file
310
- import_suffix : _product_names.tsv
310
+ import_suffix : _product_names\ .tsv$
311
311
nmdc_suffix : _product_names.tsv
312
312
input_to : []
313
313
output_of : nmdc:MetatranscriptomeAnnotation
@@ -316,7 +316,7 @@ Data Objects:
316
316
- data_object_type : Gene Phylogeny tsv
317
317
description : Gene Phylogeny for {id}
318
318
name : Gene Phylogeny file
319
- import_suffix : _gene_phylogeny.tsv
319
+ import_suffix : _gene_phylogeny\ .tsv$
320
320
nmdc_suffix : _gene_phylogeny.tsv
321
321
input_to : []
322
322
output_of : nmdc:MetatranscriptomeAnnotation
@@ -325,7 +325,7 @@ Data Objects:
325
325
- data_object_type : Crispr Terms
326
326
description : Crispr Terms for {id}
327
327
name : Crispr Terms
328
- import_suffix : _crt.crisprs
328
+ import_suffix : _crt\ .crisprs$
329
329
nmdc_suffix : _crt.crisprs
330
330
input_to : []
331
331
output_of : nmdc:MetatranscriptomeAnnotation
@@ -334,7 +334,7 @@ Data Objects:
334
334
- data_object_type : Annotation Statistics
335
335
description : Annotation Stats for {id}
336
336
name : Annotation statistics report
337
- import_suffix : _stats.tsv
337
+ import_suffix : _stats\ .tsv$
338
338
nmdc_suffix : _stats.tsv
339
339
input_to : []
340
340
output_of : nmdc:MetatranscriptomeAnnotation
@@ -343,23 +343,23 @@ Data Objects:
343
343
- data_object_type : Annotation Info File
344
344
description : Annotation Info File for {id}
345
345
name : File containing annotation info
346
- import_suffix : _imgap.info
346
+ import_suffix : _imgap\ .info$
347
347
nmdc_suffix : _imgap.info
348
348
input_to : []
349
349
output_of : nmdc:MetatranscriptomeAnnotation
350
350
multiple : false
351
351
action : rename
352
352
- data_object_type : Assembly Contigs
353
353
description : Assembly contigs (remapped) for {id}
354
- import_suffix : _contigs.fna
354
+ import_suffix : _contigs\ .fna$
355
355
nmdc_suffix : _renamed_contigs.fna
356
356
input_to : []
357
357
output_of : nmdc:MetatranscriptomeAnnotation
358
358
multiple : false
359
359
- data_object_type : Filtered Sequencing Reads
360
360
description : Reads QC for {id}
361
361
name : Reads QC result fastq (clean data)
362
- import_suffix : filter-MTF.fastq.gz
362
+ import_suffix : filter-MTF\ .fastq\ .gz$
363
363
nmdc_suffix : _filtered.fastq.gz
364
364
input_to : [nmdc:MetatranscriptomeAssembly]
365
365
output_of : nmdc:ReadQcAnalysis
@@ -368,7 +368,7 @@ Data Objects:
368
368
- data_object_type : rRNA Filtered Sequencing Reads
369
369
description : Reads QC rRNA reads file for {id}
370
370
name : Reads QC rRNA reads result fastq (clean data)
371
- import_suffix : .rRNA.fastq.gz
371
+ import_suffix : \ .rRNA\ .fastq\ .gz$
372
372
nmdc_suffix : _rRNA.fastq.gz
373
373
input_to : []
374
374
output_of : nmdc:ReadQcAnalysis
@@ -377,7 +377,7 @@ Data Objects:
377
377
- data_object_type : QC Statistics
378
378
description : Reads QC summary for {id}
379
379
name : Reads QC summary statistics
380
- import_suffix : .filtered-report.txt
380
+ import_suffix : \ .filtered-report\ .txt$
381
381
nmdc_suffix : _filterStats.txt
382
382
input_to : []
383
383
output_of : nmdc:ReadQcAnalysis
@@ -386,7 +386,7 @@ Data Objects:
386
386
- data_object_type : Read Filtering Info File
387
387
description : Read Filtering Info File for {id}
388
388
name : File containing read filtering information
389
- import_suffix : .filter_cmd-MTF.sh
389
+ import_suffix : \ .filter_cmd-MTF\ .sh$
390
390
nmdc_suffix : _readsQC.info
391
391
input_to : []
392
392
output_of : nmdc:ReadQcAnalysis
@@ -395,7 +395,7 @@ Data Objects:
395
395
- data_object_type : Assembly Contigs
396
396
description : Assembly contigs for {id}
397
397
name : Final assembly contigs fasta
398
- import_suffix : assembly.contigs.fasta
398
+ import_suffix : assembly\ .contigs\ .fasta$
399
399
nmdc_suffix : _contigs.fna
400
400
input_to : [nmdc:MetatranscriptomeAnnotation]
401
401
output_of : nmdc:MetatranscriptomeAssembly
@@ -404,7 +404,7 @@ Data Objects:
404
404
- data_object_type : Assembly Info File
405
405
description : Assembly info file for {id}
406
406
name : File containing assembly information
407
- import_suffix : README.txt
407
+ import_suffix : README\ .txt$
408
408
nmdc_suffix : _metaAsm.info
409
409
input_to : []
410
410
output_of : nmdc:MetatranscriptomeAssembly
@@ -414,15 +414,15 @@ Data Objects:
414
414
description : Coverage Stats for {id}
415
415
name : Assembled contigs coverage information
416
416
import_suffix : pairedMapped_sorted.bam.cov
417
- nmdc_suffix : _covstats.txt
417
+ nmdc_suffix : _covstats\ .txt$
418
418
input_to : []
419
419
output_of : nmdc:MetatranscriptomeAssembly
420
420
multiple : false
421
421
action : rename
422
422
- data_object_type : Assembly Coverage BAM
423
423
description : Sorted Bam for {id}
424
424
name : Sorted bam file of reads mapping back to the final assembly
425
- import_suffix : pairedMapped.bam.gz
425
+ import_suffix : pairedMapped\ .bam\ .gz$
426
426
nmdc_suffix : _pairedMapped_sorted.bam.gz
427
427
input_to : [nmdc:MetatranscriptomeExpressionAnalysis]
428
428
output_of : nmdc:MetatranscriptomeAssembly
@@ -431,7 +431,7 @@ Data Objects:
431
431
- data_object_type : BAI File
432
432
description : Alignment index file for {id}
433
433
name : BAM index file
434
- import_suffix : _pairedMapped_sorted.bam.bai
434
+ import_suffix : _pairedMapped_sorted\ .bam\ .bai$
435
435
nmdc_suffix : _pairedMapped_sorted.bam.bai
436
436
input_to : []
437
437
output_of : nmdc:MetatranscriptomeAssembly
@@ -440,7 +440,7 @@ Data Objects:
440
440
- data_object_type : Metatranscriptome Expression
441
441
description : Expression counts for {id}
442
442
name : Expression counts file
443
- import_suffix : .rnaseq_gea.txt
443
+ import_suffix : \ .rnaseq_gea\ .txt$
444
444
nmdc_suffix : _rnaseq_gea.txt
445
445
input_to : []
446
446
output_of : nmdc:MetatranscriptomeExpressionAnalysis
@@ -449,7 +449,7 @@ Data Objects:
449
449
- data_object_type : Metatranscriptome Expression Intergenic
450
450
description : Expression intergenic counts for {id}
451
451
name : Expression intergenic counts file
452
- import_suffix : .rnaseq_gea.intergenic.txt
452
+ import_suffix : \ .rnaseq_gea\ .intergenic\ .txt$
453
453
nmdc_suffix : _rnaseq_gea.intergenic.txt
454
454
input_to : []
455
455
output_of : nmdc:MetatranscriptomeExpressionAnalysis
0 commit comments