Skip to content

Commit

Permalink
🐛 Fix wrong cache dir in speech_recognition_dataset.py
Browse files Browse the repository at this point in the history
  • Loading branch information
arxyzan committed Feb 7, 2024
1 parent 0e59778 commit d7dadd6
Showing 1 changed file with 2 additions and 2 deletions.
4 changes: 2 additions & 2 deletions hezar/data/datasets/speech_recognition_dataset.py
Original file line number Diff line number Diff line change
Expand Up @@ -2,7 +2,7 @@

from dataclasses import dataclass

-from datasets import Audio, load_dataset, load_from_disk
+from datasets import Audio, load_dataset

from .dataset import Dataset
from ..data_collators import SpeechRecognitionDataCollator
Expand Down Expand Up @@ -51,7 +51,7 @@ def __init__(self, config: SpeechRecognitionDatasetConfig, split=None, **kwargs)
)

def _load(self, split):
-data = load_dataset(self.config.path, split=split)
+data = load_dataset(self.config.path, split=split, cache_dir=self.cache_dir)
data = data.cast_column(self.config.audio_column, Audio(sampling_rate=self.config.sampling_rate))
return data

Expand Down

0 comments on commit d7dadd6

Please sign in to comment.