# whisper.cpp/examples/python/whisper_processor.py

import subprocess
import sys
import os

def process_audio(wav_file, model_name="base.en"):
    """
    Transcribes an audio file by running the local ``./main`` executable and returns its cleaned output.

    The model is looked up at ``./models/ggml-<model_name>.bin`` and the executable at
    ``./main``, both relative to the current working directory.

    :param wav_file: Path to the WAV file
    :param model_name: Name of the model to use
    :return: Standard output of the command with '[BLANK_AUDIO]' markers removed and
             surrounding whitespace stripped
    :raises FileNotFoundError: if the model file or the WAV file does not exist
    :raises Exception: if the command cannot be started, writes anything to stderr,
                       or exits with a non-zero status
    """

    model = f"./models/ggml-{model_name}.bin"

    # Fail early with an actionable message when an input is missing
    if not os.path.exists(model):
        raise FileNotFoundError(f"Model file not found: {model} \n\nDownload a model with this command:\n\n> bash ./models/download-ggml-model.sh {model_name}\n\n")

    if not os.path.exists(wav_file):
        raise FileNotFoundError(f"WAV file not found: {wav_file}")

    # Pass the arguments as a list (no shell) so that paths containing spaces or
    # shell metacharacters reach the executable as single, uninterpreted arguments.
    command = ["./main", "-m", model, "-f", os.fspath(wav_file), "-nt"]

    try:
        completed = subprocess.run(command, stdout=subprocess.PIPE, stderr=subprocess.PIPE)
    except OSError as exc:
        # Without a shell, a missing or non-executable ./main surfaces as OSError;
        # report it through the same exception type and prefix as other failures.
        raise Exception(f"Error processing audio: {exc}") from exc

    # NOTE(review): any stderr output is treated as a failure, as before;
    # confirm the executable is silent on stderr when it succeeds.
    if completed.stderr:
        error_text = completed.stderr.decode('utf-8', errors='replace')
        raise Exception(f"Error processing audio: {error_text}")

    # A failing exit status is an error even when nothing was written to stderr
    if completed.returncode != 0:
        raise Exception(f"Error processing audio: ./main exited with status {completed.returncode}")

    # Decode leniently so a stray invalid byte does not discard the whole transcript
    decoded_str = completed.stdout.decode('utf-8', errors='replace').strip()
    processed_str = decoded_str.replace('[BLANK_AUDIO]', '').strip()

    return processed_str

def main():
    """
    Command-line entry point: transcribes the WAV file named in ``sys.argv`` and prints the result.

    Usage: ``python whisper_processor.py <wav_file> [<model_name>]``. When no model
    name is given, "base.en" is used. Arguments after the model name are ignored.
    Any exception raised during processing is caught and printed as ``Error: ...``.
    """
    if len(sys.argv) < 2:
        print("Usage: python whisper_processor.py <wav_file> [<model_name>]")
        return

    wav_file = sys.argv[1]
    # Use the model argument whenever it is present, even if extra arguments follow it
    model_name = sys.argv[2] if len(sys.argv) >= 3 else "base.en"
    try:
        result = process_audio(wav_file, model_name)
        print(result)
    except Exception as e:
        print(f"Error: {e}")

# Run the command-line interface only when executed as a script, not when imported
if __name__ == "__main__":
    main()
examples : add python example for transcription (#1744) * rebase and add simple python interface * moved python files to examples/python 2024-01-13 17:37:18 +00:00			`import subprocess`
			`import sys`
			`import os`

			`def process_audio(wav_file, model_name="base.en"):`
			`"""`
			`Processes an audio file using a specified model and returns the processed string.`

			`:param wav_file: Path to the WAV file`
			`:param model_name: Name of the model to use`
			`:return: Processed string output from the audio processing`
			`:raises: Exception if an error occurs during processing`
			`"""`

			`model = f"./models/ggml-{model_name}.bin"`

			`# Check if the file exists`
			`if not os.path.exists(model):`
			`raise FileNotFoundError(f"Model file not found: {model} \n\nDownload a model with this command:\n\n> bash ./models/download-ggml-model.sh {model_name}\n\n")`

			`if not os.path.exists(wav_file):`
			`raise FileNotFoundError(f"WAV file not found: {wav_file}")`

readme : remove invalid flag from Python example (#2396) * Update README.md Fix broken C-style API link * Update whisper_processor.py Update examples/python/whisper_processor.py to remove nonexistent flag "-np" from subprocess.Popen call. * Add pywhispercpp to the Pybind11 Python wrapper list abdeladim-s/pywhispercpp wasn't added to the list / was removed at some point (?) It was referenced in issue #9, so I feel like it's worthy of being added as it's the first if not one of the first Python wrappers for whisper.cpp 2024-08-30 11:00:38 +00:00			`full_command = f"./main -m {model} -f {wav_file} -nt"`
examples : add python example for transcription (#1744) * rebase and add simple python interface * moved python files to examples/python 2024-01-13 17:37:18 +00:00
			`# Execute the command`
			`process = subprocess.Popen(full_command, shell=True, stdout=subprocess.PIPE, stderr=subprocess.PIPE)`

			`# Get the output and error (if any)`
			`output, error = process.communicate()`

			`if error:`
			`raise Exception(f"Error processing audio: {error.decode('utf-8')}")`

			`# Process and return the output string`
			`decoded_str = output.decode('utf-8').strip()`
			`processed_str = decoded_str.replace('[BLANK_AUDIO]', '').strip()`

			`return processed_str`

			`def main():`
			`if len(sys.argv) >= 2:`
			`wav_file = sys.argv[1]`
			`model_name = sys.argv[2] if len(sys.argv) == 3 else "base.en"`
			`try:`
			`result = process_audio(wav_file, model_name)`
			`print(result)`
			`except Exception as e:`
			`print(f"Error: {e}")`
			`else:`
			`print("Usage: python whisper_processor.py <wav_file> [<model_name>]")`

			`if __name__ == "__main__":`
			`main()`