diff --git a/data/mozilla_deepspeech_wav2txt.py b/data/mozilla_deepspeech_wav2txt.py index 04c90019..d4a945c7 100644 --- a/data/mozilla_deepspeech_wav2txt.py +++ b/data/mozilla_deepspeech_wav2txt.py @@ -36,10 +36,10 @@ except ImportError: from pipes import quote -_global_modules_needed_by_name = ["deepspeech-gpu==0.6.1"] +_global_modules_needed_by_name = ["deepspeech-gpu==0.10.0a3"] #####Please fill up before usage -MODEL_PATH = "/home/dmitry/Desktop/DAI/deepspeech/deepspeech-0.6.1-models" +MODEL_PATH = "/home/dmitry/Desktop/DAI/deepspeech/deepspeech-0.10.0a3-models" beam_width = 500 # Beam width for the CTC decoder lm_alpha = 0.75 # Language model weight (lm_alpha) lm_beta = 1.85 # Word insertion bonus (lm_beta) @@ -67,7 +67,8 @@ def convert_samplerate(audio_path, desired_sample_rate): class MozillaDeepSpeechWav2Txt(BaseData): - _modules_needed_by_name = ["deepspeech-gpu==0.6.1"] + # Note: deepspeech-gpu only supports up to Python 3.9 + _modules_needed_by_name = ["deepspeech-gpu==0.10.0a3"] @staticmethod def create_data(X: dt.Frame = None) -> dt.Frame: