aboutsummaryrefslogtreecommitdiff
path: root/R2R/r2r/parsers/media/audio_parser.py
diff options
context:
space:
mode:
authorS. Solomon Darnell2025-03-28 21:52:21 -0500
committerS. Solomon Darnell2025-03-28 21:52:21 -0500
commit4a52a71956a8d46fcb7294ac71734504bb09bcc2 (patch)
treeee3dc5af3b6313e921cd920906356f5d4febc4ed /R2R/r2r/parsers/media/audio_parser.py
parentcc961e04ba734dd72309fb548a2f97d67d578813 (diff)
downloadgn-ai-4a52a71956a8d46fcb7294ac71734504bb09bcc2.tar.gz
two version of R2R are hereHEADmaster
Diffstat (limited to 'R2R/r2r/parsers/media/audio_parser.py')
-rwxr-xr-xR2R/r2r/parsers/media/audio_parser.py32
1 files changed, 32 insertions, 0 deletions
diff --git a/R2R/r2r/parsers/media/audio_parser.py b/R2R/r2r/parsers/media/audio_parser.py
new file mode 100755
index 00000000..8a7735e4
--- /dev/null
+++ b/R2R/r2r/parsers/media/audio_parser.py
@@ -0,0 +1,32 @@
+import os
+from typing import AsyncGenerator
+
+from r2r.base.parsers.base_parser import AsyncParser
+from r2r.parsers.media.openai_helpers import process_audio_with_openai
+
+
+class AudioParser(AsyncParser[bytes]):
+ """A parser for audio data."""
+
+ def __init__(
+ self, api_base: str = "https://api.openai.com/v1/audio/transcriptions"
+ ):
+ self.api_base = api_base
+ self.openai_api_key = os.environ.get("OPENAI_API_KEY")
+ if not self.openai_api_key:
+ raise ValueError(
+ "Error, environment variable `OPENAI_API_KEY` is required to run `AudioParser`."
+ )
+
+ async def ingest(self, data: bytes) -> AsyncGenerator[str, None]:
+ """Ingest audio data and yield a transcription."""
+ temp_audio_path = "temp_audio.wav"
+ with open(temp_audio_path, "wb") as f:
+ f.write(data)
+ try:
+ transcription_text = process_audio_with_openai(
+ open(temp_audio_path, "rb"), self.openai_api_key
+ )
+ yield transcription_text
+ finally:
+ os.remove(temp_audio_path)