mirror of
https://github.com/ggerganov/whisper.cpp.git
synced 2025-01-04 03:34:08 +00:00
9600fc3eb1
* Update README.md Fix broken C-style API link * Update whisper_processor.py Update examples/python/whisper_processor.py to remove nonexistent flag "-np" from subprocess.Popen call. * Add pywhispercpp to the Pybind11 Python wrapper list abdeladim-s/pywhispercpp wasn't added to the list / was removed at some point (?) It was referenced in issue #9, so I feel like it's worthy of being added as it's the first if not one of the first Python wrappers for whisper.cpp
55 lines
1.7 KiB
Python
55 lines
1.7 KiB
Python
import subprocess
|
|
import sys
|
|
import os
|
|
|
|
def process_audio(wav_file, model_name="base.en"):
|
|
"""
|
|
Processes an audio file using a specified model and returns the processed string.
|
|
|
|
:param wav_file: Path to the WAV file
|
|
:param model_name: Name of the model to use
|
|
:return: Processed string output from the audio processing
|
|
:raises: Exception if an error occurs during processing
|
|
"""
|
|
|
|
model = f"./models/ggml-{model_name}.bin"
|
|
|
|
# Check if the file exists
|
|
if not os.path.exists(model):
|
|
raise FileNotFoundError(f"Model file not found: {model} \n\nDownload a model with this command:\n\n> bash ./models/download-ggml-model.sh {model_name}\n\n")
|
|
|
|
if not os.path.exists(wav_file):
|
|
raise FileNotFoundError(f"WAV file not found: {wav_file}")
|
|
|
|
full_command = f"./main -m {model} -f {wav_file} -nt"
|
|
|
|
# Execute the command
|
|
process = subprocess.Popen(full_command, shell=True, stdout=subprocess.PIPE, stderr=subprocess.PIPE)
|
|
|
|
# Get the output and error (if any)
|
|
output, error = process.communicate()
|
|
|
|
if error:
|
|
raise Exception(f"Error processing audio: {error.decode('utf-8')}")
|
|
|
|
# Process and return the output string
|
|
decoded_str = output.decode('utf-8').strip()
|
|
processed_str = decoded_str.replace('[BLANK_AUDIO]', '').strip()
|
|
|
|
return processed_str
|
|
|
|
def main():
|
|
if len(sys.argv) >= 2:
|
|
wav_file = sys.argv[1]
|
|
model_name = sys.argv[2] if len(sys.argv) == 3 else "base.en"
|
|
try:
|
|
result = process_audio(wav_file, model_name)
|
|
print(result)
|
|
except Exception as e:
|
|
print(f"Error: {e}")
|
|
else:
|
|
print("Usage: python whisper_processor.py <wav_file> [<model_name>]")
|
|
|
|
if __name__ == "__main__":
|
|
main()
|