Spaces:

nnilayy
/

yt-audio-dl

Building

App Files Files Community

nnilayy committed on Jan 22

Commit

bd09639

1 Parent(s): a17935c

Add po-token logic

Browse files

Files changed (3) hide show

Dockerfile +15 -5
app.py +70 -11
tokens.json +1 -0

Dockerfile CHANGED Viewed

@@ -1,7 +1,17 @@
-# Use Python 3.10 base image
 FROM python:3.10-slim
-# Create a non-root user for security
 RUN useradd -m -u 1000 user
 USER user
 ENV PATH="/home/user/.local/bin:${PATH}"
@@ -9,15 +19,15 @@ ENV PATH="/home/user/.local/bin:${PATH}"
 # Set working directory
 WORKDIR /app
-# Install Python dependencies first for layer caching
 COPY --chown=user requirements.txt .
 RUN pip install --no-cache-dir --upgrade -r requirements.txt
 # Copy application code
 COPY --chown=user . .
-# Expose Gradio's default port
 EXPOSE 7860
-# Launch the application with Spaces-compatible settings
 CMD ["python", "app.py"]

+# Use Python 3.10 slim base image
 FROM python:3.10-slim
+# Install system dependencies and Node.js (used for initial PoToken generation).
+# Everything runs in a single layer: the NodeSource setup script and the
+# nodejs install repopulate /var/lib/apt/lists, so the cleanup has to come
+# last for the package lists to stay out of the final image.
+RUN apt-get update && apt-get install -y \
+    curl \
+    gnupg \
+    && curl -fsSL https://deb.nodesource.com/setup_20.x | bash - \
+    && apt-get install -y nodejs \
+    && rm -rf /var/lib/apt/lists/*
+# Create non-root user
 RUN useradd -m -u 1000 user
 USER user
 ENV PATH="/home/user/.local/bin:${PATH}"
 # Set working directory
 WORKDIR /app
+# Copy requirements first for better caching
 COPY --chown=user requirements.txt .
 RUN pip install --no-cache-dir --upgrade -r requirements.txt
 # Copy application code
 COPY --chown=user . .
+# Expose Gradio port
 EXPOSE 7860
+# Start application
 CMD ["python", "app.py"]

app.py CHANGED Viewed

@@ -2,35 +2,86 @@ import gradio as gr
 from pytubefix import YouTube
 import tempfile
 import base64
 from io import BytesIO
 def download_audio(url):
     try:
-        # Initialize YouTube object
-        yt = YouTube(url, 'WEB')
-        title = yt.title
-        # Get best audio stream
         audio_stream = yt.streams.filter(only_audio=True).order_by('abr').desc().first()
         if not audio_stream:
             return ["Error: No audio stream found", None, None]
-        # Download to in-memory buffer
         buffer = BytesIO()
         audio_stream.stream_to_buffer(buffer)
         buffer.seek(0)
-        # Create temporary file
         with tempfile.NamedTemporaryFile(suffix=".mp3", delete=False) as tmp_file:
             tmp_file.write(buffer.read())
             tmp_path = tmp_file.name
-        # Create HTML audio player with base64 encoding
         with open(tmp_path, "rb") as f:
             audio_bytes = f.read()
         audio_base64 = base64.b64encode(audio_bytes).decode("utf-8")
         audio_html = f"""
-        <audio controls autoplay style="width: 100%">
             <source src="data:audio/mp3;base64,{audio_base64}" type="audio/mp3">
             Your browser does not support the audio element.
         </audio>
@@ -41,10 +92,18 @@ def download_audio(url):
             tmp_path,
             audio_html
         ]
     except Exception as e:
         return [f"Error: {str(e)}", None, None]
 with gr.Blocks(title="YouTube Audio Downloader") as demo:
     gr.Markdown("# YouTube Audio Downloader")
@@ -78,5 +137,5 @@ if __name__ == "__main__":
         server_name="0.0.0.0",
         server_port=7860,
         show_error=True,
-        allowed_paths=["*"]
     )

 from pytubefix import YouTube
 import tempfile
 import base64
+import os
+import json
+import logging
 from io import BytesIO
+# Configure logging
+# Root logger is set to INFO; `logger` is this module's own logger.
+logging.basicConfig(level=logging.INFO)
+logger = logging.getLogger(__name__)
+# JSON cache for the po_token / visitor_data pair. The path is relative, so it
+# resolves against the process working directory.
+TOKEN_FILE = "tokens.json"
+def get_or_create_tokens():
+    """Get cached tokens or create new ones with Node.js"""
+    try:
+        if os.path.exists(TOKEN_FILE):
+            with open(TOKEN_FILE) as f:
+                return json.load(f)
+        # Generate new tokens using dummy request
+        logger.info("Generating new YouTube tokens...")
+        yt = YouTube("https://www.youtube.com/watch?v=dQw4w9WgXcQ", 'WEB')
+        tokens = {
+            "po_token": yt.pot,
+            "visitor_data": yt._visitor_data
+        }
+        with open(TOKEN_FILE, 'w') as f:
+            json.dump(tokens, f)
+        return tokens
+    except Exception as e:
+        logger.error(f"Token generation failed: {str(e)}")
+        raise
+def refresh_tokens():
+    """Force refresh tokens by deleting existing file"""
+    try:
+        if os.path.exists(TOKEN_FILE):
+            os.remove(TOKEN_FILE)
+        return get_or_create_tokens()
+    except Exception as e:
+        logger.error(f"Token refresh failed: {str(e)}")
+        raise
+# Load initial tokens
+# Runs once at import time. download_audio declares this name global and
+# rebinds it after a token refresh.
+tokens = get_or_create_tokens()
 def download_audio(url):
+    global tokens
     try:
+        # Try with current tokens
+        yt = YouTube(
+            url,
+            use_po_token=True,
+            po_token=tokens["po_token"],
+            visitor_data=tokens["visitor_data"],
+            allow_oauth_cache=True
+        )
+        title = yt.title
         audio_stream = yt.streams.filter(only_audio=True).order_by('abr').desc().first()
         if not audio_stream:
             return ["Error: No audio stream found", None, None]
+        # Download to memory
         buffer = BytesIO()
         audio_stream.stream_to_buffer(buffer)
         buffer.seek(0)
+        # Create temp file
         with tempfile.NamedTemporaryFile(suffix=".mp3", delete=False) as tmp_file:
             tmp_file.write(buffer.read())
             tmp_path = tmp_file.name
+        # Create HTML player
         with open(tmp_path, "rb") as f:
             audio_bytes = f.read()
         audio_base64 = base64.b64encode(audio_bytes).decode("utf-8")
         audio_html = f"""
+        <audio controls style="width: 100%">
             <source src="data:audio/mp3;base64,{audio_base64}" type="audio/mp3">
             Your browser does not support the audio element.
         </audio>
             tmp_path,
             audio_html
         ]
     except Exception as e:
+        if "bot" in str(e).lower():
+            logger.warning("Bot detected - refreshing tokens...")
+            try:
+                tokens = refresh_tokens()
+                return download_audio(url)  # Retry with new tokens
+            except Exception as retry_error:
+                return [f"Error: Failed after token refresh - {str(retry_error)}", None, None]
         return [f"Error: {str(e)}", None, None]
+# Gradio interface
 with gr.Blocks(title="YouTube Audio Downloader") as demo:
     gr.Markdown("# YouTube Audio Downloader")
         server_name="0.0.0.0",
         server_port=7860,
         show_error=True,
+        allowed_paths=["/"]
     )

tokens.json ADDED Viewed

	@@ -0,0 +1 @@


1	+ {"po_token": "MngL5Ew7WfF2bAvY5UI1JXOsEEAgc9Q1A582budFuOgRPOrmvAHa5B8jTFFrOscLs_kEw7Q_TOtWdfwFBFmtUX3jSJZvDPd6aqSKJ6FYVG1zt7izKy0Og3wtvfS8WKvifZT1bcKu8GDNEHyB69klgkYzo0FvdhWFp0o=", "visitor_data": "CgtGaTQ1bWhySkVQayilwMG8BjIKCgJJThIEGgAgYA%3D%3D"}