Skip to content
63 changes: 58 additions & 5 deletions youtube_transcriber.py
Original file line number Diff line number Diff line change
Expand Up @@ -2,12 +2,38 @@
import os
from pytube import YouTube
from openai import OpenAI
import json


class OpenAIClient:
    """Borg-style holder for a lazily-created OpenAI client.

    Every instance shares the same attribute dict (``_shared_state``),
    so the underlying ``OpenAI`` client is created at most once per API
    key regardless of how many ``OpenAIClient`` objects are constructed.
    """

    _shared_state = {}

    def __init__(self, api_key):
        # Borg pattern: all instances alias one shared attribute dict.
        self.__dict__ = self._shared_state
        # Only (re)initialize on first construction or when the key
        # actually changes. The previous unconditional reset discarded
        # the cached client on every construction, defeating the lazy
        # caching done by the `client` property below.
        first_init = "_client" not in self._shared_state
        if first_init or self._api_key != api_key:
            self._api_key = api_key
            self._client = None

    @property
    def client(self):
        # Lazily build the OpenAI SDK client and cache it in shared state.
        if self._client is None:
            self._client = OpenAI(api_key=self._api_key)
        return self._client

    def set_api_key(self, api_key):
        # Switch keys explicitly; drop the cached client so the next
        # `client` access rebuilds it with the new key.
        self._api_key = api_key
        self._client = None  # Reset client to reinitialize with new API key if needed


@click.command()
@click.argument("url")
@click.option("--api-key", envvar="OPENAI_API_KEY", help="OpenAI API Key")
def transcribe(url, api_key):
@click.option(
"--ai-audio-model", default="whisper-1", help="OpenAI audio transcription model"
)
@click.option(
"--ai-chat-model", default="gpt-4", help="OpenAI AI chat model for post-processing"
)
def transcribe(url, api_key, ai_audio_model, ai_chat_model):
"""Transcribe audio from a YouTube video."""
if not api_key:
raise click.ClickException(
Expand All @@ -20,12 +46,13 @@ def transcribe(url, api_key):
audio_filename = audio_stream.download(filename=audio_stream.default_filename)

try:
# Transcribe audio using OpenAI Whisper API
client = OpenAI(api_key=api_key)
# Initialize OpenAI client
openai_client = OpenAIClient(api_key)

# Transcribe audio using OpenAI Whisper API
with open(audio_filename, "rb") as audio_file:
transcription = client.audio.transcriptions.create(
model="whisper-1", file=audio_file
transcription = openai_client.client.audio.transcriptions.create(
model=ai_audio_model, file=audio_file
)
print(transcription.text)

Expand All @@ -34,10 +61,36 @@ def transcribe(url, api_key):
f.write(transcription.text)

click.echo(f"Transcript saved to transcript.md")

# Ask user if they want to post-process the transcript
if click.confirm("Do you want to post-process the transcript with AI?"):
transcript_postprocess(transcription.text, ai_chat_model, openai_client)
finally:
# Clean up temporary audio file
os.remove(audio_filename)


def transcript_postprocess(transcript, ai_model, openai_client):
    """Post-process the transcript using specified OpenAI model."""
    # Ask the user what they want done with the transcript text.
    request = click.prompt("What would you like to do with the transcript?")

    # Build the chat payload: a fixed system role plus the transcript
    # and the user's instruction combined into a single user message.
    messages = [
        {
            "role": "system",
            "content": (
                "You are a helpful assistant that can analyze and process video transcripts."
            ),
        },
        {
            "role": "user",
            "content": f"Please review the following transcript and respond to the user's request below.\n\n```{transcript}```\n\nUser's request: {request}",
        },
    ]

    # Run the chat completion and print the model's reply to stdout.
    completion = openai_client.client.chat.completions.create(
        model=ai_model,
        messages=messages,
        max_tokens=4096,
    )

    print("\nAI Response:")
    print(completion.choices[0].message.content)


# Run the CLI entry point only when this file is executed as a script,
# not when it is imported as a module.
if __name__ == "__main__":
    transcribe()