From 86ccdbb5cb1aea7ed3a738a34da1ed29992d3ac2 Mon Sep 17 00:00:00 2001
From: shahules786 <shahules786@gmail.com>
Date: Mon, 22 Aug 2022 10:05:34 +0530
Subject: [PATCH] dataset

---
 enhancer/data/vctk.py | 38 ++++++++++++++++++++++++++++++++++++++
 1 file changed, 38 insertions(+)
 create mode 100644 enhancer/data/vctk.py

diff --git a/enhancer/data/vctk.py b/enhancer/data/vctk.py
new file mode 100644
index 0000000..2e46662
--- /dev/null
+++ b/enhancer/data/vctk.py
@@ -0,0 +1,38 @@
+
+from genericpath import isdir
+import librosa
+import os
+from torch.utils.data import IterableDataset
+import torch
+
+
+class Vctk(IterableDataset):
+    """Dataset object for Voice Bank Corpus (VCTK) Dataset.
+
+    Raises ValueError if clean_path or noisy_path is not a directory.
+    num_samples defaults to the number of ".wav" files in clean_path;
+    sample_length is clamped to a minimum of 0.1.
+    """
+
+    def __init__(self, clean_path, noisy_path, sample_length=1, num_samples=None):
+        if not os.path.isdir(clean_path):
+            raise ValueError(f"{clean_path} is not a valid directory")
+        if not os.path.isdir(noisy_path):
+            # Report the path that actually failed the check.
+            raise ValueError(f"{noisy_path} is not a valid directory")
+
+        self.clean_path = clean_path
+        self.noisy_path = noisy_path
+
+        if num_samples is None:
+            num_samples = sum(f.endswith(".wav") for f in os.listdir(clean_path))
+        self.num_samples = num_samples
+        self.sample_length = max(0.1, sample_length)
+
+    def __iter__(self):
+        # TODO: not implemented yet; currently returns None.
+        pass
+
+    def __len__(self):
+        # TODO: not implemented yet; currently returns None.
+        pass