diff --git a/test/assets/LibriSpeech/dev-clean/1272/128104/1272-128104.trans.txt b/test/assets/LibriSpeech/dev-clean/1272/128104/1272-128104.trans.txt index bd06b7c4e2..57bf5c5086 100644 --- a/test/assets/LibriSpeech/dev-clean/1272/128104/1272-128104.trans.txt +++ b/test/assets/LibriSpeech/dev-clean/1272/128104/1272-128104.trans.txt @@ -1 +1 @@ -1272-128104-0000 THIS IS A TEST. +1272-128104-0000 MISTER QUILTER diff --git a/test/test_datasets.py b/test/test_datasets.py index 4d8cacbb4a..8f35a27b56 100644 --- a/test/test_datasets.py +++ b/test/test_datasets.py @@ -7,9 +7,12 @@ from torchaudio.datasets.vctk import VCTK from torchaudio.datasets.yesno import YESNO +import common_utils + class TestDatasets(unittest.TestCase): - path = "assets" + test_dirpath, test_dir = common_utils.create_temp_assets_dir() + path = os.path.join(test_dirpath, "assets") def test_yesno(self): data = YESNO(self.path, return_dict=True) diff --git a/torchaudio/datasets/librispeech.py b/torchaudio/datasets/librispeech.py index 59efe3fbc3..e9919ba1a3 100644 --- a/torchaudio/datasets/librispeech.py +++ b/torchaudio/datasets/librispeech.py @@ -1,7 +1,8 @@ import os -import torchaudio from torch.utils.data import Dataset + +import torchaudio from torchaudio.datasets.utils import ( download_url, extract_archive, @@ -19,7 +20,9 @@ def load_librispeech_item(fileid, path, ext_audio, ext_txt): file_text = speaker + "-" + chapter + ext_txt file_text = os.path.join(path, speaker, chapter, file_text) - file_audio = speaker + "-" + chapter + "-" + utterance + ext_audio + + fileid_audio = speaker + "-" + chapter + "-" + utterance + file_audio = fileid_audio + ext_audio file_audio = os.path.join(path, speaker, chapter, file_audio) # Load audio @@ -28,11 +31,11 @@ def load_librispeech_item(fileid, path, ext_audio, ext_txt): # Load text for line in open(file_text): fileid_text, content = line.strip().split(" ", 1) - if file_audio == fileid_text: + if fileid_audio == fileid_text: break else: # Translation not found - raise ValueError + raise FileNotFoundError("Translation not found for " + fileid_audio) return { "speaker_id": speaker,