about summary refs log tree commit diff
path: root/R2R/r2r/parsers/media/audio_parser.py
diff options
context:
space:
mode:
authorS. Solomon Darnell2025-03-28 21:52:21 -0500
committerS. Solomon Darnell2025-03-28 21:52:21 -0500
commit4a52a71956a8d46fcb7294ac71734504bb09bcc2 (patch)
treeee3dc5af3b6313e921cd920906356f5d4febc4ed /R2R/r2r/parsers/media/audio_parser.py
parentcc961e04ba734dd72309fb548a2f97d67d578813 (diff)
downloadgn-ai-4a52a71956a8d46fcb7294ac71734504bb09bcc2.tar.gz
two version of R2R are here HEAD master
Diffstat (limited to 'R2R/r2r/parsers/media/audio_parser.py')
-rwxr-xr-xR2R/r2r/parsers/media/audio_parser.py32
1 files changed, 32 insertions, 0 deletions
diff --git a/R2R/r2r/parsers/media/audio_parser.py b/R2R/r2r/parsers/media/audio_parser.py
new file mode 100755
index 00000000..8a7735e4
--- /dev/null
+++ b/R2R/r2r/parsers/media/audio_parser.py
@@ -0,0 +1,32 @@
+import os
+from typing import AsyncGenerator
+
+from r2r.base.parsers.base_parser import AsyncParser
+from r2r.parsers.media.openai_helpers import process_audio_with_openai
+
+
+class AudioParser(AsyncParser[bytes]):
+    """A parser for audio data."""
+
+    def __init__(
+        self, api_base: str = "https://api.openai.com/v1/audio/transcriptions"
+    ):
+        self.api_base = api_base
+        self.openai_api_key = os.environ.get("OPENAI_API_KEY")
+        if not self.openai_api_key:
+            raise ValueError(
+                "Error, environment variable `OPENAI_API_KEY` is required to run `AudioParser`."
+            )
+
+    async def ingest(self, data: bytes) -> AsyncGenerator[str, None]:
+        """Ingest audio data and yield a transcription."""
+        temp_audio_path = "temp_audio.wav"
+        with open(temp_audio_path, "wb") as f:
+            f.write(data)
+        try:
+            transcription_text = process_audio_with_openai(
+                open(temp_audio_path, "rb"), self.openai_api_key
+            )
+            yield transcription_text
+        finally:
+            os.remove(temp_audio_path)