mirror of
https://github.com/SevaSk/ecoute.git
synced 2024-12-25 23:21:07 +00:00
43 lines
1.5 KiB
Python
43 lines
1.5 KiB
Python
|
from __future__ import annotations
|
||
|
|
||
|
import os
|
||
|
from io import BytesIO
|
||
|
|
||
|
from speech_recognition.audio import AudioData
|
||
|
from speech_recognition.exceptions import SetupError
|
||
|
|
||
|
|
||
|
def recognize_whisper_api(
|
||
|
recognizer,
|
||
|
audio_data: "AudioData",
|
||
|
*,
|
||
|
model: str = "whisper-1",
|
||
|
api_key: str | None = None,
|
||
|
):
|
||
|
"""
|
||
|
Performs speech recognition on ``audio_data`` (an ``AudioData`` instance), using the OpenAI Whisper API.
|
||
|
|
||
|
This function requires an OpenAI account; visit https://platform.openai.com/signup, then generate API Key in `User settings <https://platform.openai.com/account/api-keys>`__.
|
||
|
|
||
|
Detail: https://platform.openai.com/docs/guides/speech-to-text
|
||
|
|
||
|
Raises a ``speech_recognition.exceptions.SetupError`` exception if there are any issues with the openai installation, or the environment variable is missing.
|
||
|
"""
|
||
|
if not isinstance(audio_data, AudioData):
|
||
|
raise ValueError("``audio_data`` must be an ``AudioData`` instance")
|
||
|
if api_key is None and os.environ.get("OPENAI_API_KEY") is None:
|
||
|
raise SetupError("Set environment variable ``OPENAI_API_KEY``")
|
||
|
|
||
|
try:
|
||
|
import openai
|
||
|
except ImportError:
|
||
|
raise SetupError(
|
||
|
"missing openai module: ensure that openai is set up correctly."
|
||
|
)
|
||
|
|
||
|
wav_data = BytesIO(audio_data.get_wav_data())
|
||
|
wav_data.name = "SpeechRecognition_audio.wav"
|
||
|
|
||
|
transcript = openai.Audio.transcribe(model, wav_data, api_key=api_key)
|
||
|
return transcript["text"]
|