huyanxin · qianjr2002 · Nov 30, 2024 · Nov 30, 2024
diff --git a/.gitignore b/.gitignore
@@ -0,0 +1 @@
+__pychache__/
diff --git a/README.md b/README.md
@@ -5,3 +5,4 @@ Paper: https://arxiv.org/abs/2008.00264
 
 Sample: https://huyanxin.github.io/DeepComplexCRN/
 
+Python 3.10.15 (main, Oct  3 2024, 07:27:34) [GCC 11.2.0] on linux
diff --git a/data_loader.py b/data_loader.py
@@ -0,0 +1,63 @@
+import os
+import torch
+import torchaudio
+from torch.utils.data import Dataset, DataLoader
+
+
+class VCTKDataset(Dataset):
+    def __init__(self, clean_dir, noisy_dir, max_length=160000):
+        self.clean_dir = clean_dir
+        self.noisy_dir = noisy_dir
+        self.clean_files = sorted(os.listdir(clean_dir))
+        self.noisy_files = sorted(os.listdir(noisy_dir))
+        assert len(self.clean_files) == len(self.noisy_files), \
+            "Mismatch between number of clean and noisy files."
+        self.max_length = max_length
+        self.n_fft = 512
+        self.hop_length = 256
+        self.win_length = 512
+        self.window_fn = torch.hann_window(
+            self.win_length).sqrt()
+
+    def __len__(self):
+        return len(self.clean_files)
+
+    def __getitem__(self, idx):
+        clean_path = os.path.join(self.clean_dir, self.clean_files[idx])
+        noisy_path = os.path.join(self.noisy_dir, self.noisy_files[idx])
+
+        clean_signal, _ = torchaudio.load(clean_path)
+        noisy_signal, _ = torchaudio.load(noisy_path)
+
+        min_length = min(clean_signal.size(
+            1), noisy_signal.size(1), self.max_length)
+        clean_signal = clean_signal[:, :min_length]
+        noisy_signal = noisy_signal[:, :min_length]
+
+        if clean_signal.shape[1] < self.max_length:
+            pad_amount = self.max_length - clean_signal.shape[1]
+            clean_signal = torch.nn.functional.pad(
+                clean_signal, (0, pad_amount))
+            noisy_signal = torch.nn.functional.pad(
+                noisy_signal, (0, pad_amount))
+
+        window_fn = self.window_fn.to(clean_signal.device)
+
+        clean_spec = torch.stft(
+            clean_signal, n_fft=self.n_fft, hop_length=self.hop_length,
+            win_length=self.win_length, window=window_fn, return_complex=True
+        )
+        noisy_spec = torch.stft(
+            noisy_signal, n_fft=self.n_fft, hop_length=self.hop_length,
+            win_length=self.win_length, window=window_fn, return_complex=True
+        )
+
+        clean_spec = torch.view_as_real(clean_spec)
+        noisy_spec = torch.view_as_real(noisy_spec)
+
+        return noisy_spec, clean_spec
+
+
+def create_dataloader(clean_dir, noisy_dir, batch_size, max_length=160000):
+    dataset = VCTKDataset(clean_dir, noisy_dir, max_length)
+    return DataLoader(dataset, batch_size=batch_size, shuffle=True)
diff --git a/dataset.py b/dataset.py
@@ -0,0 +1,31 @@
+import os
+import torchaudio
+from torch.utils.data import Dataset
+
+
+class VCTKDEMANDDataset(Dataset):
+    def __init__(self, root_dir, transform=None):
+        self.root_dir = root_dir
+        self.transform = transform
+        self.clean_files = sorted(os.listdir(
+            os.path.join(root_dir, 'train', 'clean')))
+        self.noisy_files = sorted(os.listdir(
+            os.path.join(root_dir, 'train', 'noisy')))
+
+    def __len__(self):
+        return len(self.clean_files)
+
+    def __getitem__(self, idx):
+        clean_path = os.path.join(
+            self.root_dir, 'train', 'clean', self.clean_files[idx])
+        noisy_path = os.path.join(
+            self.root_dir, 'train', 'noisy', self.noisy_files[idx])
+
+        clean_waveform, _ = torchaudio.load(clean_path)
+        noisy_waveform, _ = torchaudio.load(noisy_path)
+
+        if self.transform:
+            clean_waveform = self.transform(clean_waveform)
+            noisy_waveform = self.transform(noisy_waveform)
+
+        return noisy_waveform, clean_waveform
Original file line number	Diff line number	Diff line change
Expand Up		@@ -5,3 +5,4 @@ Paper: https://arxiv.org/abs/2008.00264

		Sample: https://huyanxin.github.io/DeepComplexCRN/

		Python 3.10.15 (main, Oct 3 2024, 07:27:34) [GCC 11.2.0] on linux