Skip to content

Commit

Permalink
Add comment to dataloader_audio.py
Browse files Browse the repository at this point in the history
  • Loading branch information
yeexunwei committed Sep 30, 2021
1 parent 1b1b165 commit 280ac0f
Showing 1 changed file with 11 additions and 21 deletions.
32 changes: 11 additions & 21 deletions dataloader_audio.py
Original file line number Diff line number Diff line change
Expand Up @@ -5,6 +5,11 @@
from utils import TextProcess

class AudioDataset(torch.utils.data.Dataset):
"""
Load data from directory.
WAV audio is transformed to a spectrogram.
Return (spectrogram, label, spec_len, label_len) to dataloader
"""

def __init__(self, audio_dir, label_dir, sample_rate=16000, n_feats=128, transform=None):
labels = []
Expand Down Expand Up @@ -48,8 +53,11 @@ def __getitem__(self, index):

def collate_fn(batch):

# A data tuple has the form:
# spectrogram, label, input_length, label_length
"""
Pad the spectrograms and labels in each batch to a common length.
A data tuple has the form:
spectrogram, label, input_length, label_length
"""

spectrograms = []
labels = []
Expand All @@ -68,22 +76,4 @@ def collate_fn(batch):
print(spectrograms.shape)
labels = torch.nn.utils.rnn.pad_sequence(labels, batch_first=True) #torch.stack(labels)

return spectrograms, labels, input_lengths, label_lengths







if __name__ == '__main__':
AUDIO_DIR = 'data/audio'
LABEL_DIR = 'data/label'

training_data = AudioDataset(AUDIO_DIR, LABEL_DIR)
# test_data = AudioDataset(AUDIO_DIR, LABEL_DIR)

print(len(training_data))

# train_dataloader = torch.utils.data.DataLoader(training_data, batch_size=64, shuffle=True)
# test_dataloader = torch.utils.data.DataLoader(test_data, batch_size=64, shuffle=True)
return spectrograms, labels, input_lengths, label_lengths

0 comments on commit 280ac0f

Please sign in to comment.