# pdns_synthesizer_icassp2023.cfg
# Repository forked from microsoft/DNS-Challenge.
# Configuration for generating Noisy Speech Dataset
# - sampling_rate: Specify the sampling rate. Default is 16 kHz
# - audioformat: default is .wav
# - audio_length: Minimum Length of each audio clip (noisy and clean speech) in seconds that will be generated by augmenting utterances.
# - silence_length: Duration of silence introduced between clean speech utterances.
# - total_hours: Total number of hours of data required. Units are in hours.
# - snr_lower: Lower bound for SNR required (default: 0 dB)
# - snr_upper: Upper bound for SNR required (default: 40 dB)
# - target_level_lower: Lower bound for the target audio level before audiowrite (default: -35 dB)
# - target_level_upper: Upper bound for the target audio level before audiowrite (default: -15 dB)
# - total_snrlevels: Number of SNR levels required (default: 5, which means there are 5 levels between snr_lower and snr_upper)
# - clean_activity_threshold: Activity threshold for clean speech
# - noise_activity_threshold: Activity threshold for noise
# - fileindex_start: Starting file ID that will be used in filenames
# - fileindex_end: Last file ID that will be used in filenames
# - is_test_set: Set it to True if it is the test set, else False for the training set
# - noise_dir: Specify the directory path to all noise files
# - speech_dir: Specify the directory path to all clean speech files
# - noisy_destination: Specify path to the destination directory to store noisy speech
# - clean_destination: Specify path to the destination directory to store clean speech
# - noise_destination: Specify path to the destination directory to store the noise signals
# - log_dir: Specify path to the directory to store all the log files
# Configuration for unit tests
# - snr_test: Set to True if SNR test is required, else False
# - norm_test: Set to True if Normalization test is required, else False
# - sampling_rate_test: Set to True if Sampling Rate test is required, else False
# - clipping_test: Set to True if Clipping test is required, else False
# - unit_tests_log_dir: Specify path to the directory where you want to store logs
# Core synthesis parameters. Every key in this file lives in this one section.
[noisy_speech]
# Sampling rate in Hz (the header comment cites 16 kHz as the default; 48 kHz is used here).
sampling_rate: 48000
# Audio file pattern (the header comment cites .wav as the default format).
audioformat: *.wav
# Minimum length of each generated clip, in seconds.
audio_length: 30
# Alternative audio_length values kept for reference: 15, 12, 30
# Duration of silence inserted between clean speech utterances (presumably seconds -- confirm).
silence_length: 0.2
# Total amount of data to generate, in hours.
total_hours: 1000
# Alternative total_hours values kept for reference:
# 1000
#200
# 2.5, 500, 100
# Lower SNR bound in dB.
snr_lower: -5
# Alternative snr_lower values kept for reference: -5, 0
# Upper SNR bound in dB.
snr_upper: 20
# Alternative snr_upper values kept for reference: 25, 40
# NOTE(review): not described in the header comment; presumably selects a random SNR
# between snr_lower and snr_upper instead of fixed levels -- confirm against the consumer.
randomize_snr: True
# Bounds (dB) for the target audio level applied before audiowrite.
target_level_lower: -35
target_level_upper: -15
# Number of SNR levels between snr_lower and snr_upper.
total_snrlevels: 31
# Alternative total_snrlevels value kept for reference: 5
# Activity thresholds for clean speech and for noise.
clean_activity_threshold: 0.0
noise_activity_threshold: 0.2
# First and last file ID used in output filenames; None leaves them unset.
fileindex_start: None
fileindex_end: None
# True for the test set, False for the training set.
is_test_set: False
# Allowed is_test_set values: True, False
# --- Input and output locations ---
# Lines starting with '#' directly below a key are alternative paths kept for reference.
# Directory containing all noise files.
noise_dir: /mnt/f/4th_DNSChallenge/ICASSP_2022/DNS-Challenge/datasets/noise
#/mnt/f/4th_DNSChallenge/INTERSPEECH_2021/DNS-Challenge/datasets_fullband/noise
#F:\4th_DNSChallenge\INTERSPEECH_2021\DNS-Challenge\datasets_fullband\noise
#datasets\pdns_training_set\noise
#\test_set2\Test_Noise
# datasets\noise
# \datasets\noise
# Directory containing all clean speech files.
speech_dir: /mnt/f/4th_DNSChallenge/ICASSP_2022/DNS-Challenge/datasets/clean
# D:\kanhawin_git\primary_speakers_VCTK_16k_for_synthesizer
# datasets\test_set2\Singing_Voice\wav_16k
# dir with secondary speaker clean speech
# NOTE(review): currently set to the same directory as speech_dir.
speech_dir2: /mnt/f/4th_DNSChallenge/ICASSP_2022/DNS-Challenge/datasets/clean
#D:\kanhawin_git\secondary_speakers_voxCeleb2_16k
# datasets\test_set2\Singing_Voice\wav_16k
# CSV file list (presumably maps clips to speaker IDs -- confirm against the consumer).
spkid_csv: /mnt/f/4th_DNSChallenge/ICASSP_2022/DNS-Challenge/datasets/filelists/complete_ps_split.csv
#/mnt/f/4th_DNSChallenge/ICASSP_2022/DNS-Challenge/datasets/filelists/vctk_spkid.csv
# datasets\clean
# Noise types to leave out; None presumably excludes nothing -- confirm.
noise_types_excluded: None
# Directory with room impulse responses.
rir_dir: /mnt/f/4th_DNSChallenge/ICASSP_2022/DNS-Challenge/datasets/pdns_training_set/impulse_responses
#/mnt/f/4th_DNSChallenge/ICASSP_2022/DNS-Challenge/datasets/impulse_responses
# F:\4th_DNSChallenge\ICASSP_2022\DNS-Challenge\datasets\impulse_responses
# \datasets\clean
# Destination directory for the generated noisy speech.
noisy_destination: /mnt/f/4th_DNSChallenge/ICASSP_2022/DNS-Challenge/datasets/pdns_training_set/mixed/noisy
# datasets/training_data/noisy
# datasets\test_set2\synthetic_personalizeddns\noisy
#training_set2_onlyrealrir\noisy
#\noisy
# Destination directory for the clean speech.
clean_destination: /mnt/f/4th_DNSChallenge/ICASSP_2022/DNS-Challenge/datasets/pdns_training_set/mixed/clean
#datasets\test_set2\synthetic_personalizeddns\clean
# training_set2_onlyrealrir\clean
# \clean
# Destination directory for the noise.
noise_destination: /mnt/f/4th_DNSChallenge/ICASSP_2022/DNS-Challenge/datasets/pdns_training_set/mixed/noise
# datasets/training_data/noise
#datasets\test_set2\synthetic_personalizeddns\noise
#training_set2_onlyrealrir\noise
# \noise
# Directory for log files (relative path).
log_dir: logs
# \logs
# Config: add singing voice to clean speech
# Relative paths below use forward slashes so they resolve on POSIX hosts, matching
# the /mnt/... paths used elsewhere in this file.
# Directory with the clean singing-voice recordings.
clean_singing: datasets/clean_singing/VocalSet11/FULL
# 1 for only male, 2 for only female, 3 (default) for both male and female
singing_choice: 3
# Config: add reverb to clean speech
# 1 for only real rir, 2 for only synthetic rir, 3 (default) use both real and synthetic
rir_choice: 1
# lower bound of t60 range in seconds
lower_t60: 0.3
# upper bound of t60 range in seconds
upper_t60: 1.3
# CSV table describing the available RIRs.
rir_table_csv: datasets/acoustic_params/RIR_table_simple.csv
# CSV table for clean speech (file name suggests T60 and C50 values -- confirm).
clean_speech_t60_csv: datasets/acoustic_params/cleanspeech_table_t60_c50.csv
# Disabled option: percentage of clean speech convolved with RIR
# percent_for_adding_reverb=0.5
# pdns testsets
# primary_data: D:\kanhawin_git\primary_speakers_VCTK_16k
#'D:\PersonalizedDNS_dataset\synthetic_primary'
# secondary_data='D:\kanhawin_git\secondary_speakers_voxCeleb2_16k'
#'D:\PersonalizedDNS_dataset\synthetic_secondary'
# noise_data= datasets\test_set2\synthetic\noise
# pdns_testset_clean= datasets\test_set2\pdns\clean
# pdns_testset_noisy= datasets\test_set2\pdns\noisy
# adaptation_data_seconds=120
# num_primary_spk=100
# num_clips=600
# Unit tests config
# Each *_test switch is True when that test is required, else False.
# All keys use ':' as the delimiter, like every other key in this section.
snr_test: True
norm_test: True
sampling_rate_test: True
clipping_test: True
# Directory where the unit-test logs are stored.
unit_tests_log_dir: unittests_logs