diff --git a/transcription-api/backends/backend.py b/transcription-api/backends/backend.py index 9153ce3..a170923 100644 --- a/transcription-api/backends/backend.py +++ b/transcription-api/backends/backend.py @@ -3,7 +3,7 @@ import numpy as np from faster_whisper.audio import decode_audio # type: ignore -SUPPORTED_MODELS = ["tiny", "tiny.en", "small", "small.en", "base", "base.en", "medium", "medium.en", "large-v2", "large-v3"] +SUPPORTED_MODELS = ["distil-large-v3", "distil-large-v2", "distil-medium.en", "turbo"] WordData = TypedDict( "WordData", {"word": str, "start": float | str, "end": float | str, "score": float} @@ -65,4 +65,4 @@ def transcribe(self, input: np.ndarray) -> list[Segment]: """ This should return word level transcription data. """ - raise NotImplementedError() \ No newline at end of file + raise NotImplementedError()