From 1001a055db07bed3860ec3982e8c81a79eb28385 Mon Sep 17 00:00:00 2001 From: Jakub Kukul Date: Tue, 10 Oct 2023 10:20:58 +0200 Subject: [PATCH] Support language names in --language. --- whisperx/transcribe.py | 9 ++++++++- 1 file changed, 8 insertions(+), 1 deletion(-) diff --git a/whisperx/transcribe.py b/whisperx/transcribe.py index 8a8db13f..6f7a4ae4 100644 --- a/whisperx/transcribe.py +++ b/whisperx/transcribe.py @@ -111,8 +111,15 @@ def cli(): max_speakers: int = args.pop("max_speakers") print_progress: bool = args.pop("print_progress") + if args["language"] is not None: + args["language"] = args["language"].lower() + if args["language"] not in LANGUAGES: + if args["language"] in TO_LANGUAGE_CODE: + args["language"] = TO_LANGUAGE_CODE[args["language"]] + else: + raise ValueError(f"Unsupported language: {args['language']}") - if model_name.endswith(".en") and args["language"] not in {"en", "English"}: + if model_name.endswith(".en") and args["language"] != "en": if args["language"] is not None: warnings.warn( f"{model_name} is an English-only model but receipted '{args['language']}'; using English instead."