Spaces:

natasa365
/

whisper.cpp

Running

App Files Files Community

contractorwolf commited on Jan 13, 2024

Commit

d600e4c

unverified ·

1 Parent(s): 0e9101f

examples : add python example for transcription (#1744)

Browse files

* rebase and add simple python interface

* moved python files to examples/python

Files changed (2) hide show

examples/python/test_whisper_processor.py +7 -0
examples/python/whisper_processor.py +54 -0

examples/python/test_whisper_processor.py ADDED Viewed

	@@ -0,0 +1,7 @@

+import whisper_processor
+try:
+    result = whisper_processor.process_audio("./audio/wake_word_detected16k.wav", "base.en")
+    print(result)
+except Exception as e:
+    print(f"Error: {e}")

examples/python/whisper_processor.py ADDED Viewed

	@@ -0,0 +1,54 @@

+import subprocess
+import sys
+import os
+def process_audio(wav_file, model_name="base.en"):
+    """
+    Processes an audio file using a specified model and returns the processed string.
+    :param wav_file: Path to the WAV file
+    :param model_name: Name of the model to use
+    :return: Processed string output from the audio processing
+    :raises: Exception if an error occurs during processing
+    """
+    model = f"./models/ggml-{model_name}.bin"
+    # Check if the file exists
+    if not os.path.exists(model):
+        raise FileNotFoundError(f"Model file not found: {model} \n\nDownload a model with this command:\n\n> bash ./models/download-ggml-model.sh {model_name}\n\n")
+    if not os.path.exists(wav_file):
+        raise FileNotFoundError(f"WAV file not found: {wav_file}")
+    full_command = f"./main -m {model} -f {wav_file} -np -nt"
+    # Execute the command
+    process = subprocess.Popen(full_command, shell=True, stdout=subprocess.PIPE, stderr=subprocess.PIPE)
+    # Get the output and error (if any)
+    output, error = process.communicate()
+    if error:
+        raise Exception(f"Error processing audio: {error.decode('utf-8')}")
+    # Process and return the output string
+    decoded_str = output.decode('utf-8').strip()
+    processed_str = decoded_str.replace('[BLANK_AUDIO]', '').strip()
+    return processed_str
+def main():
+    if len(sys.argv) >= 2:
+        wav_file = sys.argv[1]
+        model_name = sys.argv[2] if len(sys.argv) == 3 else "base.en"
+        try:
+            result = process_audio(wav_file, model_name)
+            print(result)
+        except Exception as e:
+            print(f"Error: {e}")
+    else:
+        print("Usage: python whisper_processor.py <wav_file> [<model_name>]")
+if __name__ == "__main__":
+    main()