diff --git a/montreal_forced_aligner/online/transcription.py b/montreal_forced_aligner/online/transcription.py index cf07b198..30f96af9 100644 --- a/montreal_forced_aligner/online/transcription.py +++ b/montreal_forced_aligner/online/transcription.py @@ -4,7 +4,6 @@ import typing import numpy as np -import torch from _kalpy.fstext import ConstFst from _kalpy.matrix import DoubleMatrix, FloatMatrix from kalpy.data import Segment @@ -129,6 +128,8 @@ def transcribe_utterance_online_speechbrain( raise Exception( "Could not import speechbrain, please ensure it is installed via `pip install speechbrain`" ) + import torch + segment = utterance.segment waveform = segment.load_audio() waveform = model.audio_normalizer(waveform, 16000).unsqueeze(0)