From d2cebf8b028afe7f25af732c5baa25b1db8e8d57 Mon Sep 17 00:00:00 2001
From: tcsenpai <dev@tcsenpai.com>
Date: Wed, 25 Dec 2024 20:38:25 +0100
Subject: [PATCH] added po_token support at runtime

---
 env.example          |  3 ++-
 src/main.py          | 62 +++++++++++++++++++++++++-------------------
 src/yt_audiophile.py | 19 ++++++++++----
 3 files changed, 51 insertions(+), 33 deletions(-)
diff --git a/env.example b/env.example
index 57a0aa7..fcbe546 100644
--- a/env.example
+++ b/env.example
@@ -3,4 +3,5 @@ OLLAMA_MODEL=llama3.1:8b
 YOUTUBE_API_KEY=your_youtube_api_key
 WHISPER_URL=http://localhost:8000/
 WHISPER_MODEL=Systran/faster-whisper-large-v3
-PASTEBIN_API_KEY=your_pastebin_api_key
\ No newline at end of file
+PASTEBIN_API_KEY=your_pastebin_api_key
+USE_PO_TOKEN=true 
\ No newline at end of file
diff --git a/src/main.py b/src/main.py
index 8ec1ce7..56f6758 100644
--- a/src/main.py
+++ b/src/main.py
@@ -252,7 +252,12 @@ def get_ollama_models(ollama_url):
 
 
 def summarize_video(
-    video_url, model, ollama_url, fallback_to_whisper=True, force_whisper=False
+    video_url,
+    model,
+    ollama_url,
+    fallback_to_whisper=True,
+    force_whisper=False,
+    use_po_token=None,
 ):
     video_id = None
     # Get the video id from the url if it's a valid youtube or invidious or any other url that contains a video id
@@ -284,7 +289,7 @@ def summarize_video(
             show_warning("Unable to fetch transcript. Trying to download audio...")
         try:
             print("Downloading audio...")
-            download_audio(video_url)
+            download_audio(video_url, use_po_token=use_po_token)
             show_info("Audio downloaded successfully!")
             show_warning("Starting transcription...it might take a while...")
             transcript = transcribe("downloads/output.m4a")
@@ -320,7 +325,12 @@ def summarize_video(
 
 
 def fix_transcript(
-    video_url, model, ollama_url, fallback_to_whisper=True, force_whisper=False
+    video_url,
+    model,
+    ollama_url,
+    fallback_to_whisper=True,
+    force_whisper=False,
+    use_po_token=None,
 ):
     video_id = None
     # Get the video id from the url if it's a valid youtube or invidious or any other url that contains a video id
@@ -352,7 +362,7 @@ def fix_transcript(
             show_warning("Unable to fetch transcript. Trying to download audio...")
         try:
             print("Downloading audio...")
-            download_audio(video_url)
+            download_audio(video_url, use_po_token=use_po_token)
             show_info("Audio downloaded successfully!")
             show_warning("Starting transcription...it might take a while...")
             transcript = transcribe("downloads/output.m4a")
@@ -437,31 +447,27 @@ def main():
             read_button = st.button("📖 Read", use_container_width=True)
 
     # Advanced settings in collapsible sections
-    with st.expander("⚙️ Advanced Settings"):
-        # Whisper Settings
-        st.subheader("🎤 Whisper Settings")
-        default_whisper_url = os.getenv("WHISPER_URL")
-        whisper_url = st.text_input(
-            "Whisper URL",
-            value=default_whisper_url,
-            placeholder="Enter Whisper URL",
-        )
-        if not whisper_url:
-            whisper_url = default_whisper_url
+    with st.expander("⚙️ Advanced Settings", expanded=False):
+        col1, col2 = st.columns(2)
 
-        whisper_model = os.getenv("WHISPER_MODEL")
-        if not whisper_model:
-            whisper_model = "Systran/faster-whisper-large-v3"
-        st.caption(f"Current model: {whisper_model}")
+        with col1:
+            fallback_to_whisper = st.checkbox(
+                "Fallback to Whisper",
+                value=True,
+                help="If no transcript is available, try to generate one using Whisper",
+            )
+            force_whisper = st.checkbox(
+                "Force Whisper",
+                value=False,
+                help="Always use Whisper for transcription",
+            )
 
-        st.markdown("<br>", unsafe_allow_html=True)  # Add some spacing
-
-        # Whisper Options
-        adv_col1, adv_col2 = st.columns(2)
-        with adv_col1:
-            force_whisper = st.checkbox("Force Whisper", value=False)
-        with adv_col2:
-            fallback_to_whisper = st.checkbox("Fallback to Whisper", value=True)
+        with col2:
+            use_po_token = st.checkbox(
+                "Use PO Token",
+                value=get_po_token_setting(),  # Default from environment
+                help="Use PO token for YouTube authentication (helps bypass restrictions)",
+            )
 
     if (summarize_button or read_button) and video_url:
         if read_button:
@@ -472,6 +478,7 @@ def main():
                 ollama_url,
                 fallback_to_whisper=fallback_to_whisper,
                 force_whisper=force_whisper,
+                use_po_token=use_po_token,
             )
 
             # Display results
@@ -502,6 +509,7 @@ def main():
                 ollama_url,
                 fallback_to_whisper=fallback_to_whisper,
                 force_whisper=force_whisper,
+                use_po_token=use_po_token,
             )
 
             # Video Information
diff --git a/src/yt_audiophile.py b/src/yt_audiophile.py
index 2663b91..494af65 100644
--- a/src/yt_audiophile.py
+++ b/src/yt_audiophile.py
@@ -1,20 +1,29 @@
 from pytubefix import YouTube
 from pytubefix.cli import on_progress
+from dotenv import load_dotenv
+import os
 
-"""e.g.
-https://www.youtube.com/watch?v=vwTDiLH6mqg
-"""
+load_dotenv()
 
 
-def download_audio(url):
+def get_po_token_setting():
+    env_setting = os.getenv("USE_PO_TOKEN", "true").lower() == "true"
+    return env_setting
+
+
+def download_audio(url, use_po_token=None):
     try:
+        # If use_po_token is not provided, use the environment variable
+        if use_po_token is None:
+            use_po_token = get_po_token_setting()
+
         # Create YouTube object with bot detection bypass
         yt = YouTube(
             url,
             on_progress_callback=on_progress,
             use_oauth=True,
             allow_oauth_cache=True,
-            use_po_token=True,  # Add this to bypass bot detection
+            use_po_token=use_po_token,  # Now configurable
         )
 
         # Get audio stream