-
Notifications
You must be signed in to change notification settings - Fork 2
/
mapping_config_defaults.yaml
122 lines (111 loc) · 3.89 KB
/
mapping_config_defaults.yaml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
#---------------------------------------- general pipeline parameters
pipeline_param:
# adjust pattern of stored files
out_path_pattern: mapping/{step}/{sample}.{mate}/out/{step}.{sample}.{mate}.{extension}
log_path_pattern: mapping/{step}/{sample}.{mate}/report/{step}.{sample}.{mate}.{extension}
in_path_pattern: ../input/{sample}/{sample}.{mate}
# adjust which files to produce
mapping_results:
- salmon-transcript_counts
- star-gene_counts
- ciri-circRNA
QC_results:
- fastqc
- dupradar
- infer_experiment
- qualimap_rnaseq
- qualimap_bamqc
#- rna_seqc
- preseq_c_curve
- preseq_lc_extrap
#- bw_from_bed
#ATAC_Seq:
# - macs2
test_config: true
report_snippets: ""
#---------------------------------------- organism annotation
organism_defaults: null
#---------------------------------------- parameters for rules
rule_options:
star:
cmd_opt: "--outSAMunmapped Within --outFilterType BySJout --outFilterMultimapNmax 20 --alignSJoverhangMin 8 --alignSJDBoverhangMin 1 --outFilterMismatchNmax 999 --outFilterMismatchNoverLmax 0.04 --alignIntronMin 20 --alignIntronMax 1000000 --alignMatesGapMax 1000000 --genomeLoad NoSharedMemory --outSAMattributes NH HI AS NM MD --outSAMtype BAM Unsorted"
trim: yes
star_index:
cmd_opt: "--sjdbOverhang 49" # optimally sjdbOverhang = <read_length> - 1
salmon_index:
cmd_opt: "-k 31" # (k the default k-mer size of 31 is suitable for read length around 75)
salmon:
cmd_opt: ""
trim: yes
rna_seqc:
cmd_opt: ""
ciri:
cmd_opt: "-low -S 500000"
bwa:
cmd_opt: "-T 19"
trim: yes
run_stats: yes
bwa_index:
cmd_opt: ""
feature_counts:
cmd_opt: ""
#---------------------------------------- parameters for the report
report:
multiqc:
title: SeA-SnaP mapping pipeline QC report
subtitle: run at the BIH CUBI
intro_text: The reports summarises results of several analyses
custom_logo: documentation/pictures/SeA-SnaP_logo.png
sp:
fastqc/zip:
fn: '*_fastqc.zip'
qualimap/rnaseq/rnaseq_results:
fn: '*rnaseq_qc_results.txt'
qualimap/rnaseq/coverage:
fn: '*coverage_profile_along_genes_(total).txt'
qualimap/bamqc/genome_results:
fn: '*genome_results.txt'
qualimap/bamqc/coverage:
fn: '*coverage_histogram.txt'
qualimap/bamqc/insert_size:
fn: '*insert_size_histogram.txt'
qualimap/bamqc/genome_fraction:
fn: '*genome_fraction_coverage.txt'
qualimap/bamqc/gc_dist:
fn: '*mapped_reads_gc-content_distribution.txt'
salmon/meta:
fn: '*meta_info.json'
contents: 'salmon_version'
salmon/fld:
fn: '*flenDist.txt'
#---------------------------------------- configuration for export
export:
blueprint:
file: SODAR_export_blueprint.txt
command: |
imkdir -p $(dirname {dest} )
irsync -a -K {src} i:{dest}
path_pattern:
- __SODAR__/{sample}/{GENOME}/%Y_%m_%d/{files:ngs_mapping:out}/{step}/out/{step}.{sample}.{extension}
- __SODAR__/{sample}/{GENOME}/%Y_%m_%d/{files:ngs_mapping:rep}/{step}/report.zip
- __SODAR__/{sample}/{GENOME}/%Y_%m_%d/{files:gene_expression_quantification}/{step}/out/{step}.{sample}.{extension}
ngs_mapping_out:
- files: {step: star, extension: bam}
ngs_mapping_rep:
- dir: {step: star, log: true}
compress: zip
gene_expression_quantification:
- files: {step: star, extension: gene_counts.tab}
- files: {step: salmon, extension: sf}
UCSC_export:
blueprint: false
path_pattern:
- my_UCSC_track_hub/{GENOME}/{files:mapped_reads}.{step}.{sample}.{extension}
mapped_reads:
- files: {step: star, mate: all_mates, extension: bam}
- files: {step: star, mate: all_mates, extension: bam.bai}
#---------------------------------------- circRNA report
circRNA_report:
snippet_parameters: {}
defaults: {}
report_snippets: []