From 6343978c5fbc557267a3b0b725bd829a0f83af6f Mon Sep 17 00:00:00 2001
From: Peifan Li <frank.li.oxygen@gmail.com>
Date: Tue, 9 Dec 2025 22:06:31 -0500
Subject: [PATCH] feat: Add yt-dlp download functionality and helpers

---
 .../services/downloaders/YtDlpDownloader.ts   | 1069 ++++++++++-------
 build-and-push.sh                             |    4 +-
 2 files changed, 658 insertions(+), 415 deletions(-)
diff --git a/backend/src/services/downloaders/YtDlpDownloader.ts b/backend/src/services/downloaders/YtDlpDownloader.ts
index d728180..3cd5704 100644
--- a/backend/src/services/downloaders/YtDlpDownloader.ts
+++ b/backend/src/services/downloaders/YtDlpDownloader.ts
@@ -1,451 +1,694 @@
 import axios from "axios";
+import { spawn } from "child_process";
 import fs from "fs-extra";
 import path from "path";
-import youtubedl from "youtube-dl-exec";
 import { IMAGES_DIR, SUBTITLES_DIR, VIDEOS_DIR } from "../../config/paths";
 import { formatVideoFilename } from "../../utils/helpers";
 import * as storageService from "../storageService";
 import { Video } from "../storageService";
 
 const YT_DLP_PATH = process.env.YT_DLP_PATH || "yt-dlp";
-const PROVIDER_SCRIPT = process.env.BGUTIL_SCRIPT_PATH || path.join(process.cwd(), "bgutil-ytdlp-pot-provider/server/build/generate_once.js");
+const PROVIDER_SCRIPT =
+  process.env.BGUTIL_SCRIPT_PATH ||
+  path.join(
+    process.cwd(),
+    "bgutil-ytdlp-pot-provider/server/build/generate_once.js"
+  );
+
+/**
+ * Convert camelCase flag names to kebab-case CLI arguments
+ */
+function convertFlagToArg(flag: string): string {
+  return `--${flag.replace(/([A-Z])/g, "-$1").toLowerCase()}`;
+}
+
+/**
+ * Convert flags object to yt-dlp CLI arguments array
+ */
+function flagsToArgs(flags: Record<string, any>): string[] {
+  const args: string[] = [];
+
+  for (const [key, value] of Object.entries(flags)) {
+    if (value === undefined || value === null) {
+      continue;
+    }
+
+    // Handle special cases
+    if (key === "extractorArgs") {
+      // Support semicolon-separated extractor args (e.g., "youtube:key=value;other:key=value")
+      if (typeof value === "string" && value.includes(";")) {
+        const parts = value.split(";");
+        for (const part of parts) {
+          if (part.trim()) {
+            args.push("--extractor-args", part.trim());
+          }
+        }
+      } else {
+        args.push("--extractor-args", value);
+      }
+      continue;
+    }
+
+    if (key === "addHeader") {
+      // addHeader is an array of "key:value" strings
+      if (Array.isArray(value)) {
+        for (const header of value) {
+          args.push("--add-header", header);
+        }
+      } else {
+        args.push("--add-header", value);
+      }
+      continue;
+    }
+
+    // Convert camelCase to kebab-case
+    const argName = convertFlagToArg(key);
+
+    if (typeof value === "boolean") {
+      if (value) {
+        args.push(argName);
+      }
+    } else if (typeof value === "string" || typeof value === "number") {
+      args.push(argName, String(value));
+    } else if (Array.isArray(value)) {
+      // For arrays, join with comma or repeat the flag
+      args.push(argName, value.join(","));
+    }
+  }
+
+  return args;
+}
+
+/**
+ * Execute yt-dlp with JSON output and return parsed result
+ */
+async function executeYtDlpJson(
+  url: string,
+  flags: Record<string, any> = {}
+): Promise<any> {
+  const args = [
+    "--dump-single-json",
+    "--no-warnings",
+    ...flagsToArgs(flags),
+    url,
+  ];
+
+  console.log(`Executing: ${YT_DLP_PATH} ${args.join(" ")}`);
+
+  return new Promise<any>((resolve, reject) => {
+    const subprocess = spawn(YT_DLP_PATH, args, {
+      stdio: ["ignore", "pipe", "pipe"],
+    });
+
+    let stdout = "";
+    let stderr = "";
+
+    subprocess.stdout?.on("data", (data: Buffer) => {
+      stdout += data.toString();
+    });
+
+    subprocess.stderr?.on("data", (data: Buffer) => {
+      stderr += data.toString();
+    });
+
+    subprocess.on("close", (code) => {
+      if (code !== 0) {
+        const error = new Error(`yt-dlp process exited with code ${code}`);
+        (error as any).stderr = stderr;
+        reject(error);
+        return;
+      }
+
+      if (
+        stderr &&
+        !stderr.includes("[download]") &&
+        !stderr.includes("[info]")
+      ) {
+        console.warn("yt-dlp stderr:", stderr);
+      }
+
+      try {
+        resolve(JSON.parse(stdout));
+      } catch (parseError) {
+        console.error("Failed to parse yt-dlp JSON output:", parseError);
+        console.error("Output:", stdout);
+        reject(new Error("Failed to parse yt-dlp output as JSON"));
+      }
+    });
+
+    subprocess.on("error", (error) => {
+      reject(error);
+    });
+  });
+}
+
+/**
+ * Execute yt-dlp with spawn for progress tracking
+ * Returns a subprocess-like object with kill() method
+ */
+function executeYtDlpSpawn(
+  url: string,
+  flags: Record<string, any> = {}
+): {
+  stdout: NodeJS.ReadableStream | null;
+  stderr: NodeJS.ReadableStream | null;
+  kill: (signal?: NodeJS.Signals) => boolean;
+  then: (
+    onFulfilled?: (value: void) => void | Promise<void>,
+    onRejected?: (reason: any) => void | Promise<void>
+  ) => Promise<void>;
+} {
+  const args = [...flagsToArgs(flags), url];
+
+  console.log(`Spawning: ${YT_DLP_PATH} ${args.join(" ")}`);
+
+  const subprocess = spawn(YT_DLP_PATH, args, {
+    stdio: ["ignore", "pipe", "pipe"],
+  });
+
+  let resolved = false;
+  let rejected = false;
+  let resolveFn: (() => void) | null = null;
+  let rejectFn: ((error: Error) => void) | null = null;
+
+  const promise = new Promise<void>((resolve, reject) => {
+    resolveFn = resolve;
+    rejectFn = reject;
+
+    subprocess.on("close", (code) => {
+      if (code === 0) {
+        if (!resolved && !rejected) {
+          resolved = true;
+          resolve();
+        }
+      } else {
+        if (!resolved && !rejected) {
+          rejected = true;
+          reject(new Error(`yt-dlp process exited with code ${code}`));
+        }
+      }
+    });
+
+    subprocess.on("error", (error) => {
+      if (!resolved && !rejected) {
+        rejected = true;
+        reject(error);
+      }
+    });
+  });
+
+  return {
+    stdout: subprocess.stdout,
+    stderr: subprocess.stderr,
+    kill: (signal?: NodeJS.Signals) => {
+      if (!subprocess.killed) {
+        return subprocess.kill(signal);
+      }
+      return false;
+    },
+    then: promise.then.bind(promise),
+  };
+}
 
 // Helper function to extract author from XiaoHongShu page when yt-dlp doesn't provide it
 async function extractXiaoHongShuAuthor(url: string): Promise<string | null> {
-    try {
-        console.log("Attempting to extract XiaoHongShu author from webpage...");
-        const response = await axios.get(url, {
-            headers: {
-                'User-Agent': 'Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_7) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/120.0.0.0 Safari/537.36'
-            },
-            timeout: 10000
-        });
-        
-        const html = response.data;
-        
-        // Try to find author name in the JSON data embedded in the page
-        // XiaoHongShu embeds data in window.__INITIAL_STATE__
-        const match = html.match(/"nickname":"([^"]+)"/);
-        if (match && match[1]) {
-            console.log("Found XiaoHongShu author:", match[1]);
-            return match[1];
-        }
-        
-        // Alternative: try to find in user info
-        const userMatch = html.match(/"user":\{[^}]*"nickname":"([^"]+)"/);
-        if (userMatch && userMatch[1]) {
-            console.log("Found XiaoHongShu author (user):", userMatch[1]);
-            return userMatch[1];
-        }
-        
-        console.log("Could not extract XiaoHongShu author from webpage");
-        return null;
-    } catch (error) {
-        console.error("Error extracting XiaoHongShu author:", error);
-        return null;
+  try {
+    console.log("Attempting to extract XiaoHongShu author from webpage...");
+    const response = await axios.get(url, {
+      headers: {
+        "User-Agent":
+          "Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_7) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/120.0.0.0 Safari/537.36",
+      },
+      timeout: 10000,
+    });
+
+    const html = response.data;
+
+    // Try to find author name in the JSON data embedded in the page
+    // XiaoHongShu embeds data in window.__INITIAL_STATE__
+    const match = html.match(/"nickname":"([^"]+)"/);
+    if (match && match[1]) {
+      console.log("Found XiaoHongShu author:", match[1]);
+      return match[1];
     }
+
+    // Alternative: try to find in user info
+    const userMatch = html.match(/"user":\{[^}]*"nickname":"([^"]+)"/);
+    if (userMatch && userMatch[1]) {
+      console.log("Found XiaoHongShu author (user):", userMatch[1]);
+      return userMatch[1];
+    }
+
+    console.log("Could not extract XiaoHongShu author from webpage");
+    return null;
+  } catch (error) {
+    console.error("Error extracting XiaoHongShu author:", error);
+    return null;
+  }
 }
 
 export class YtDlpDownloader {
-    // Search for videos (primarily for YouTube, but could be adapted)
-    static async search(query: string): Promise<any[]> {
-        console.log("Processing search request for query:", query);
+  // Search for videos (primarily for YouTube, but could be adapted)
+  static async search(query: string): Promise<any[]> {
+    console.log("Processing search request for query:", query);
 
-        // Use ytsearch for searching
-        const searchResults = await youtubedl(`ytsearch5:${query}`, {
-            dumpSingleJson: true,
-            noWarnings: true,
-            skipDownload: true,
-            playlistEnd: 5, // Limit to 5 results
-            extractorArgs: `youtubepot-bgutilscript:script_path=${PROVIDER_SCRIPT}`,
-        } as any, { execPath: YT_DLP_PATH } as any);
+    // Use ytsearch for searching
+    const searchResults = await executeYtDlpJson(`ytsearch5:${query}`, {
+      noWarnings: true,
+      skipDownload: true,
+      playlistEnd: 5, // Limit to 5 results
+      extractorArgs: `youtubepot-bgutilscript:script_path=${PROVIDER_SCRIPT}`,
+    });
 
-        if (!searchResults || !(searchResults as any).entries) {
-            return [];
+    if (!searchResults || !searchResults.entries) {
+      return [];
+    }
+
+    // Format the search results
+    const formattedResults = searchResults.entries.map((entry: any) => ({
+      id: entry.id,
+      title: entry.title,
+      author: entry.uploader,
+      thumbnailUrl: entry.thumbnail,
+      duration: entry.duration,
+      viewCount: entry.view_count,
+      sourceUrl: `https://www.youtube.com/watch?v=${entry.id}`, // Default to YT for search results
+      source: "youtube",
+    }));
+
+    console.log(
+      `Found ${formattedResults.length} search results for "${query}"`
+    );
+
+    return formattedResults;
+  }
+
+  // Get video info without downloading
+  static async getVideoInfo(
+    url: string
+  ): Promise<{
+    title: string;
+    author: string;
+    date: string;
+    thumbnailUrl: string;
+  }> {
+    try {
+      const info = await executeYtDlpJson(url, {
+        noWarnings: true,
+        preferFreeFormats: true,
+        extractorArgs: `youtubepot-bgutilscript:script_path=${PROVIDER_SCRIPT}`,
+      });
+
+      return {
+        title: info.title || "Video",
+        author: info.uploader || "Unknown",
+        date:
+          info.upload_date ||
+          new Date().toISOString().slice(0, 10).replace(/-/g, ""),
+        thumbnailUrl: info.thumbnail,
+      };
+    } catch (error) {
+      console.error("Error fetching video info:", error);
+      return {
+        title: "Video",
+        author: "Unknown",
+        date: new Date().toISOString().slice(0, 10).replace(/-/g, ""),
+        thumbnailUrl: "",
+      };
+    }
+  }
+
+  // Get the latest video URL from a channel
+  static async getLatestVideoUrl(channelUrl: string): Promise<string | null> {
+    try {
+      console.log("Fetching latest video for channel:", channelUrl);
+
+      // Append /videos to channel URL to ensure we get videos and not the channel tab
+      let targetUrl = channelUrl;
+      if (
+        channelUrl.includes("youtube.com/") &&
+        !channelUrl.includes("/videos") &&
+        !channelUrl.includes("/shorts") &&
+        !channelUrl.includes("/streams")
+      ) {
+        // Check if it looks like a channel URL
+        if (
+          channelUrl.includes("/@") ||
+          channelUrl.includes("/channel/") ||
+          channelUrl.includes("/c/") ||
+          channelUrl.includes("/user/")
+        ) {
+          targetUrl = `${channelUrl}/videos`;
+          console.log("Modified channel URL to:", targetUrl);
         }
+      }
 
-        // Format the search results
-        const formattedResults = (searchResults as any).entries.map((entry: any) => ({
-            id: entry.id,
-            title: entry.title,
-            author: entry.uploader,
-            thumbnailUrl: entry.thumbnail,
-            duration: entry.duration,
-            viewCount: entry.view_count,
-            sourceUrl: `https://www.youtube.com/watch?v=${entry.id}`, // Default to YT for search results
-            source: "youtube",
-        }));
+      // Use yt-dlp to get the first video in the channel (playlist)
+      const result = await executeYtDlpJson(targetUrl, {
+        playlistEnd: 5,
+        noWarnings: true,
+        flatPlaylist: true, // We only need the ID/URL, not full info
+        extractorArgs: `youtubepot-bgutilscript:script_path=${PROVIDER_SCRIPT}`,
+      });
 
-        console.log(
-            `Found ${formattedResults.length} search results for "${query}"`
+      // If it's a playlist/channel, 'entries' will contain the videos
+      if (result.entries && result.entries.length > 0) {
+        // Iterate through entries to find a valid video
+        // Sometimes the first entry is the channel/tab itself (e.g. id starts with UC)
+        for (const entry of result.entries) {
+          // Skip entries that look like channel IDs (start with UC and are 24 chars)
+          // or entries without a title/url that look like metadata
+          if (entry.id && entry.id.startsWith("UC") && entry.id.length === 24) {
+            continue;
+          }
+
+          const videoId = entry.id;
+          if (videoId) {
+            return `https://www.youtube.com/watch?v=${videoId}`;
+          }
+          if (entry.url) {
+            return entry.url;
+          }
+        }
+      }
+      return null;
+    } catch (error) {
+      console.error("Error fetching latest video URL:", error);
+      return null;
+    }
+  }
+
+  // Download video
+  static async downloadVideo(
+    videoUrl: string,
+    downloadId?: string,
+    onStart?: (cancel: () => void) => void
+  ): Promise<Video> {
+    console.log("Detected URL:", videoUrl);
+
+    // Create a safe base filename (without extension)
+    const timestamp = Date.now();
+    const safeBaseFilename = `video_${timestamp}`;
+
+    // Add extensions for video and thumbnail
+    const videoFilename = `${safeBaseFilename}.mp4`;
+    const thumbnailFilename = `${safeBaseFilename}.jpg`;
+
+    let videoTitle,
+      videoAuthor,
+      videoDate,
+      videoDescription,
+      thumbnailUrl,
+      thumbnailSaved,
+      source;
+    let finalVideoFilename = videoFilename;
+    let finalThumbnailFilename = thumbnailFilename;
+    let subtitles: Array<{ language: string; filename: string; path: string }> =
+      [];
+
+    try {
+      // Get video info first
+      const info = await executeYtDlpJson(videoUrl, {
+        noWarnings: true,
+        preferFreeFormats: true,
+        extractorArgs: `youtubepot-bgutilscript:script_path=${PROVIDER_SCRIPT}`,
+      });
+
+      console.log("Video info:", {
+        title: info.title,
+        uploader: info.uploader,
+        upload_date: info.upload_date,
+        extractor: info.extractor,
+      });
+
+      videoTitle = info.title || "Video";
+      videoAuthor = info.uploader || "Unknown";
+
+      // If author is unknown and it's a XiaoHongShu video, try custom extraction
+      if (
+        (!info.uploader || info.uploader === "Unknown") &&
+        info.extractor === "XiaoHongShu"
+      ) {
+        const customAuthor = await extractXiaoHongShuAuthor(videoUrl);
+        if (customAuthor) {
+          videoAuthor = customAuthor;
+        }
+      }
+      videoDescription = info.description || "";
+      videoDate =
+        info.upload_date ||
+        new Date().toISOString().slice(0, 10).replace(/-/g, "");
+      thumbnailUrl = info.thumbnail;
+      source = info.extractor || "generic";
+
+      // Update the safe base filename with the actual title
+      const newSafeBaseFilename = formatVideoFilename(
+        videoTitle,
+        videoAuthor,
+        videoDate
+      );
+      const newVideoFilename = `${newSafeBaseFilename}.mp4`;
+      const newThumbnailFilename = `${newSafeBaseFilename}.jpg`;
+
+      // Update the filenames
+      finalVideoFilename = newVideoFilename;
+      finalThumbnailFilename = newThumbnailFilename;
+
+      // Update paths
+      const newVideoPath = path.join(VIDEOS_DIR, finalVideoFilename);
+      const newThumbnailPath = path.join(IMAGES_DIR, finalThumbnailFilename);
+
+      // Download the video
+      console.log("Downloading video to:", newVideoPath);
+
+      if (downloadId) {
+        storageService.updateActiveDownload(downloadId, {
+          filename: videoTitle,
+          progress: 0,
+        });
+      }
+
+      // Prepare flags
+      const flags: Record<string, any> = {
+        output: newVideoPath,
+        format: "bestvideo[ext=mp4]+bestaudio[ext=m4a]/best[ext=mp4]/best",
+        mergeOutputFormat: "mp4",
+        writeSubs: true,
+        writeAutoSubs: true,
+        convertSubs: "vtt",
+        extractorArgs: `youtubepot-bgutilscript:script_path=${PROVIDER_SCRIPT}`,
+      };
+
+      // Add YouTube specific flags if it's a YouTube URL
+      if (videoUrl.includes("youtube.com") || videoUrl.includes("youtu.be")) {
+        flags.format =
+          "bestvideo[ext=mp4][vcodec^=avc1]+bestaudio[ext=m4a][acodec=aac]/bestvideo[ext=mp4][vcodec=h264]+bestaudio[ext=m4a]/best[ext=mp4]/best";
+        // Combine YouTube extractor args with PO token provider
+        flags.extractorArgs = `youtube:player_client=android;youtubepot-bgutilscript:script_path=${PROVIDER_SCRIPT}`;
+        flags.addHeader = [
+          "Referer:https://www.youtube.com/",
+          "User-Agent:Mozilla/5.0 (Linux; Android 10; K) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/120.0.0.0 Mobile Safari/537.36",
+        ];
+      }
+
+      // Use spawn to capture stdout for progress
+      const subprocess = executeYtDlpSpawn(videoUrl, flags);
+
+      if (onStart) {
+        onStart(() => {
+          console.log("Killing subprocess for download:", downloadId);
+          subprocess.kill();
+
+          // Clean up partial files
+          console.log("Cleaning up partial files...");
+          try {
+            const partVideoPath = `${newVideoPath}.part`;
+            const partThumbnailPath = `${newThumbnailPath}.part`;
+
+            if (fs.existsSync(partVideoPath)) {
+              fs.unlinkSync(partVideoPath);
+              console.log("Deleted partial video file:", partVideoPath);
+            }
+            if (fs.existsSync(newVideoPath)) {
+              fs.unlinkSync(newVideoPath);
+              console.log("Deleted partial video file:", newVideoPath);
+            }
+            if (fs.existsSync(partThumbnailPath)) {
+              fs.unlinkSync(partThumbnailPath);
+              console.log("Deleted partial thumbnail file:", partThumbnailPath);
+            }
+            if (fs.existsSync(newThumbnailPath)) {
+              fs.unlinkSync(newThumbnailPath);
+              console.log("Deleted partial thumbnail file:", newThumbnailPath);
+            }
+          } catch (cleanupError) {
+            console.error("Error cleaning up partial files:", cleanupError);
+          }
+        });
+      }
+
+      subprocess.stdout?.on("data", (data: Buffer) => {
+        const output = data.toString();
+        // Parse progress: [download]  23.5% of 10.00MiB at  2.00MiB/s ETA 00:05
+        const progressMatch = output.match(
+          /(\d+\.?\d*)%\s+of\s+([~\d\w.]+)\s+at\s+([~\d\w.\/]+)/
         );
 
-        return formattedResults;
-    }
+        if (progressMatch && downloadId) {
+          const percentage = parseFloat(progressMatch[1]);
+          const totalSize = progressMatch[2];
+          const speed = progressMatch[3];
 
-    // Get video info without downloading
-    static async getVideoInfo(url: string): Promise<{ title: string; author: string; date: string; thumbnailUrl: string }> {
-        try {
-            const info = await youtubedl(url, {
-                dumpSingleJson: true,
-                noWarnings: true,
-                preferFreeFormats: true,
-                // youtubeSkipDashManifest: true, // Specific to YT, might want to keep or make conditional
-                extractorArgs: `youtubepot-bgutilscript:script_path=${PROVIDER_SCRIPT}`,
-            } as any, { execPath: YT_DLP_PATH } as any);
-
-            return {
-                title: info.title || "Video",
-                author: info.uploader || "Unknown",
-                date: info.upload_date || new Date().toISOString().slice(0, 10).replace(/-/g, ""),
-                thumbnailUrl: info.thumbnail,
-            };
-        } catch (error) {
-            console.error("Error fetching video info:", error);
-            return {
-                title: "Video",
-                author: "Unknown",
-                date: new Date().toISOString().slice(0, 10).replace(/-/g, ""),
-                thumbnailUrl: "",
-            };
+          storageService.updateActiveDownload(downloadId, {
+            progress: percentage,
+            totalSize: totalSize,
+            speed: speed,
+          });
         }
-    }
+      });
 
-    // Get the latest video URL from a channel
-    static async getLatestVideoUrl(channelUrl: string): Promise<string | null> {
+      await subprocess;
+
+      console.log("Video downloaded successfully");
+
+      // Download and save the thumbnail
+      thumbnailSaved = false;
+
+      if (thumbnailUrl) {
         try {
-            console.log("Fetching latest video for channel:", channelUrl);
-            
-            // Append /videos to channel URL to ensure we get videos and not the channel tab
-            let targetUrl = channelUrl;
-            if (channelUrl.includes('youtube.com/') && !channelUrl.includes('/videos') && !channelUrl.includes('/shorts') && !channelUrl.includes('/streams')) {
-                // Check if it looks like a channel URL
-                if (channelUrl.includes('/@') || channelUrl.includes('/channel/') || channelUrl.includes('/c/') || channelUrl.includes('/user/')) {
-                    targetUrl = `${channelUrl}/videos`;
-                    console.log("Modified channel URL to:", targetUrl);
-                }
-            }
+          console.log("Downloading thumbnail from:", thumbnailUrl);
 
-            // Use yt-dlp to get the first video in the channel (playlist)
-            const result = await youtubedl(targetUrl, {
-                dumpSingleJson: true,
-                playlistEnd: 5,
-                noWarnings: true,
-                flatPlaylist: true, // We only need the ID/URL, not full info
-                extractorArgs: `youtubepot-bgutilscript:script_path=${PROVIDER_SCRIPT}`,
-            } as any, { execPath: YT_DLP_PATH } as any);
+          const thumbnailResponse = await axios({
+            method: "GET",
+            url: thumbnailUrl,
+            responseType: "stream",
+          });
 
-            // If it's a playlist/channel, 'entries' will contain the videos
-            if ((result as any).entries && (result as any).entries.length > 0) {
-                // Iterate through entries to find a valid video
-                // Sometimes the first entry is the channel/tab itself (e.g. id starts with UC)
-                for (const entry of (result as any).entries) {
-                    // Skip entries that look like channel IDs (start with UC and are 24 chars)
-                    // or entries without a title/url that look like metadata
-                    if (entry.id && entry.id.startsWith('UC') && entry.id.length === 24) {
-                        continue;
-                    }
+          const thumbnailWriter = fs.createWriteStream(newThumbnailPath);
+          thumbnailResponse.data.pipe(thumbnailWriter);
 
-                    const videoId = entry.id;
-                    if (videoId) {
-                        return `https://www.youtube.com/watch?v=${videoId}`;
-                    }
-                    if (entry.url) {
-                        return entry.url;
-                    }
-                }
-            }
-            return null;
-        } catch (error) {
-            console.error("Error fetching latest video URL:", error);
-            return null;
-        }
-    }
-
-    // Download video
-    static async downloadVideo(videoUrl: string, downloadId?: string, onStart?: (cancel: () => void) => void): Promise<Video> {
-        console.log("Detected URL:", videoUrl);
-
-        // Create a safe base filename (without extension)
-        const timestamp = Date.now();
-        const safeBaseFilename = `video_${timestamp}`;
-
-        // Add extensions for video and thumbnail
-        const videoFilename = `${safeBaseFilename}.mp4`;
-        const thumbnailFilename = `${safeBaseFilename}.jpg`;
-
-        let videoTitle, videoAuthor, videoDate, videoDescription, thumbnailUrl, thumbnailSaved, source;
-        let finalVideoFilename = videoFilename;
-        let finalThumbnailFilename = thumbnailFilename;
-        let subtitles: Array<{ language: string; filename: string; path: string }> = [];
-
-        try {
-            // Get video info first
-            const info = await youtubedl(videoUrl, {
-                dumpSingleJson: true,
-                noWarnings: true,
-                preferFreeFormats: true,
-                extractorArgs: `youtubepot-bgutilscript:script_path=${PROVIDER_SCRIPT}`,
-            } as any, { execPath: YT_DLP_PATH } as any);
-
-            console.log("Video info:", {
-                title: info.title,
-                uploader: info.uploader,
-                upload_date: info.upload_date,
-                extractor: info.extractor,
+          await new Promise<void>((resolve, reject) => {
+            thumbnailWriter.on("finish", () => {
+              thumbnailSaved = true;
+              resolve();
             });
+            thumbnailWriter.on("error", reject);
+          });
 
-            videoTitle = info.title || "Video";
-            videoAuthor = info.uploader || "Unknown";
-            
-            // If author is unknown and it's a XiaoHongShu video, try custom extraction
-            if ((!info.uploader || info.uploader === "Unknown") && info.extractor === "XiaoHongShu") {
-                const customAuthor = await extractXiaoHongShuAuthor(videoUrl);
-                if (customAuthor) {
-                    videoAuthor = customAuthor;
-                }
-            }
-            videoDescription = info.description || "";
-            videoDate =
-                info.upload_date ||
-                new Date().toISOString().slice(0, 10).replace(/-/g, "");
-            thumbnailUrl = info.thumbnail;
-            source = info.extractor || "generic";
-
-            // Update the safe base filename with the actual title
-            const newSafeBaseFilename = formatVideoFilename(videoTitle, videoAuthor, videoDate);
-            const newVideoFilename = `${newSafeBaseFilename}.mp4`;
-            const newThumbnailFilename = `${newSafeBaseFilename}.jpg`;
-
-            // Update the filenames
-            finalVideoFilename = newVideoFilename;
-            finalThumbnailFilename = newThumbnailFilename;
-
-            // Update paths
-            const newVideoPath = path.join(VIDEOS_DIR, finalVideoFilename);
-            const newThumbnailPath = path.join(IMAGES_DIR, finalThumbnailFilename);
-
-            // Download the video
-            console.log("Downloading video to:", newVideoPath);
-
-            if (downloadId) {
-                storageService.updateActiveDownload(downloadId, {
-                    filename: videoTitle,
-                    progress: 0
-                });
-            }
-
-            // Prepare flags
-            const flags: any = {
-                output: newVideoPath,
-                format: "bestvideo[ext=mp4]+bestaudio[ext=m4a]/best[ext=mp4]/best",
-                mergeOutputFormat: "mp4",
-                writeSubs: true,
-                writeAutoSubs: true,
-                convertSubs: "vtt",
-            };
-
-            // Add YouTube specific flags if it's a YouTube URL
-            if (videoUrl.includes("youtube.com") || videoUrl.includes("youtu.be")) {
-                 flags.format = "bestvideo[ext=mp4][vcodec^=avc1]+bestaudio[ext=m4a][acodec=aac]/bestvideo[ext=mp4][vcodec=h264]+bestaudio[ext=m4a]/best[ext=mp4]/best";
-                 flags['extractor-args'] = "youtube:player_client=android";
-                 flags.addHeader = [
-                    'Referer:https://www.youtube.com/',
-                    'User-Agent:Mozilla/5.0 (Linux; Android 10; K) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/120.0.0.0 Mobile Safari/537.36'
-                ];
-            }
-
-            // Add PO Token provider args
-            flags.extractorArgs = `youtubepot-bgutilscript:script_path=${PROVIDER_SCRIPT}`;
-
-            // Use exec to capture stdout for progress
-            const subprocess = youtubedl.exec(videoUrl, flags, { execPath: YT_DLP_PATH } as any);
-
-            if (onStart) {
-                onStart(() => {
-                    console.log("Killing subprocess for download:", downloadId);
-                    subprocess.kill();
-                    
-                    // Clean up partial files
-                    console.log("Cleaning up partial files...");
-                    try {
-                        const partVideoPath = `${newVideoPath}.part`;
-                        const partThumbnailPath = `${newThumbnailPath}.part`;
-                        
-                        if (fs.existsSync(partVideoPath)) {
-                            fs.unlinkSync(partVideoPath);
-                            console.log("Deleted partial video file:", partVideoPath);
-                        }
-                        if (fs.existsSync(newVideoPath)) {
-                            fs.unlinkSync(newVideoPath);
-                            console.log("Deleted partial video file:", newVideoPath);
-                        }
-                        if (fs.existsSync(partThumbnailPath)) {
-                            fs.unlinkSync(partThumbnailPath);
-                            console.log("Deleted partial thumbnail file:", partThumbnailPath);
-                        }
-                        if (fs.existsSync(newThumbnailPath)) {
-                            fs.unlinkSync(newThumbnailPath);
-                            console.log("Deleted partial thumbnail file:", newThumbnailPath);
-                        }
-                    } catch (cleanupError) {
-                        console.error("Error cleaning up partial files:", cleanupError);
-                    }
-                });
-            }
-
-            subprocess.stdout?.on('data', (data: Buffer) => {
-                const output = data.toString();
-                // Parse progress: [download]  23.5% of 10.00MiB at  2.00MiB/s ETA 00:05
-                const progressMatch = output.match(/(\d+\.?\d*)%\s+of\s+([~\d\w.]+)\s+at\s+([~\d\w.\/]+)/);
-
-                if (progressMatch && downloadId) {
-                    const percentage = parseFloat(progressMatch[1]);
-                    const totalSize = progressMatch[2];
-                    const speed = progressMatch[3];
-
-                    storageService.updateActiveDownload(downloadId, {
-                        progress: percentage,
-                        totalSize: totalSize,
-                        speed: speed
-                    });
-                }
-            });
-
-            await subprocess;
-
-            console.log("Video downloaded successfully");
-
-            // Download and save the thumbnail
-            thumbnailSaved = false;
-
-            if (thumbnailUrl) {
-                try {
-                    console.log("Downloading thumbnail from:", thumbnailUrl);
-
-                    const thumbnailResponse = await axios({
-                        method: "GET",
-                        url: thumbnailUrl,
-                        responseType: "stream",
-                    });
-
-                    const thumbnailWriter = fs.createWriteStream(newThumbnailPath);
-                    thumbnailResponse.data.pipe(thumbnailWriter);
-
-                    await new Promise<void>((resolve, reject) => {
-                        thumbnailWriter.on("finish", () => {
-                            thumbnailSaved = true;
-                            resolve();
-                        });
-                        thumbnailWriter.on("error", reject);
-                    });
-
-                    console.log("Thumbnail saved to:", newThumbnailPath);
-                } catch (thumbnailError) {
-                    console.error("Error downloading thumbnail:", thumbnailError);
-                    // Continue even if thumbnail download fails
-                }
-            }
-            // Scan for subtitle files
-            try {
-                const baseFilename = newSafeBaseFilename;
-                const subtitleFiles = fs.readdirSync(VIDEOS_DIR).filter((file: string) => 
-                    file.startsWith(baseFilename) && file.endsWith(".vtt")
-                );
-
-                console.log(`Found ${subtitleFiles.length} subtitle files`);
-
-                for (const subtitleFile of subtitleFiles) {
-                    // Parse language from filename (e.g., video_123.en.vtt -> en)
-                    const match = subtitleFile.match(/\.([a-z]{2}(?:-[A-Z]{2})?)(?:\..*?)?\.vtt$/);
-                    const language = match ? match[1] : "unknown";
-
-                    // Move subtitle to subtitles directory
-                    const sourceSubPath = path.join(VIDEOS_DIR, subtitleFile);
-                    const destSubFilename = `${baseFilename}.${language}.vtt`;
-                    const destSubPath = path.join(SUBTITLES_DIR, destSubFilename);
-
-                    // Read VTT file and fix alignment for centering
-                    let vttContent = fs.readFileSync(sourceSubPath, 'utf-8');
-                    // Replace align:start with align:middle for centered subtitles
-                    // Also remove position:0% which forces left positioning
-                    vttContent = vttContent.replace(/ align:start/g, ' align:middle');
-                    vttContent = vttContent.replace(/ position:0%/g, '');
-                    
-                    // Write cleaned VTT to destination
-                    fs.writeFileSync(destSubPath, vttContent, 'utf-8');
-                    
-                    // Remove original file
-                    fs.unlinkSync(sourceSubPath);
-                    
-                    console.log(`Processed and moved subtitle ${subtitleFile} to ${destSubPath}`);
-
-                    subtitles.push({
-                        language,
-                        filename: destSubFilename,
-                        path: `/subtitles/${destSubFilename}`,
-                    });
-                }
-            } catch (subtitleError) {
-                console.error("Error processing subtitle files:", subtitleError);
-            }
-
-        } catch (error) {
-            console.error("Error in download process:", error);
-            throw error;
+          console.log("Thumbnail saved to:", newThumbnailPath);
+        } catch (thumbnailError) {
+          console.error("Error downloading thumbnail:", thumbnailError);
+          // Continue even if thumbnail download fails
         }
+      }
+      // Scan for subtitle files
+      try {
+        const baseFilename = newSafeBaseFilename;
+        const subtitleFiles = fs
+          .readdirSync(VIDEOS_DIR)
+          .filter(
+            (file: string) =>
+              file.startsWith(baseFilename) && file.endsWith(".vtt")
+          );
 
-        // Create metadata for the video
-        const videoData: Video = {
-            id: timestamp.toString(),
-            title: videoTitle || "Video",
-            author: videoAuthor || "Unknown",
-            description: videoDescription,
-            date:
-                videoDate || new Date().toISOString().slice(0, 10).replace(/-/g, ""),
-            source: source, // Use extracted source
-            sourceUrl: videoUrl,
-            videoFilename: finalVideoFilename,
-            thumbnailFilename: thumbnailSaved ? finalThumbnailFilename : undefined,
-            thumbnailUrl: thumbnailUrl || undefined,
-            videoPath: `/videos/${finalVideoFilename}`,
-            thumbnailPath: thumbnailSaved
-                ? `/images/${finalThumbnailFilename}`
-                : null,
-            subtitles: subtitles.length > 0 ? subtitles : undefined,
-            duration: undefined, // Will be populated below
-            addedAt: new Date().toISOString(),
-            createdAt: new Date().toISOString(),
-        };
+        console.log(`Found ${subtitleFiles.length} subtitle files`);
 
-        // If duration is missing from info, try to extract it from file
-        const finalVideoPath = path.join(VIDEOS_DIR, finalVideoFilename);
-        
-        try {
-             const { getVideoDuration } = await import("../../services/metadataService");
-             const duration = await getVideoDuration(finalVideoPath);
-             if (duration) {
-                 videoData.duration = duration.toString();
-             }
-        } catch (e) {
-             console.error("Failed to extract duration from downloaded file:", e);
+        for (const subtitleFile of subtitleFiles) {
+          // Parse language from filename (e.g., video_123.en.vtt -> en)
+          const match = subtitleFile.match(
+            /\.([a-z]{2}(?:-[A-Z]{2})?)(?:\..*?)?\.vtt$/
+          );
+          const language = match ? match[1] : "unknown";
+
+          // Move subtitle to subtitles directory
+          const sourceSubPath = path.join(VIDEOS_DIR, subtitleFile);
+          const destSubFilename = `${baseFilename}.${language}.vtt`;
+          const destSubPath = path.join(SUBTITLES_DIR, destSubFilename);
+
+          // Read VTT file and fix alignment for centering
+          let vttContent = fs.readFileSync(sourceSubPath, "utf-8");
+          // Replace align:start with align:middle for centered subtitles
+          // Also remove position:0% which forces left positioning
+          vttContent = vttContent.replace(/ align:start/g, " align:middle");
+          vttContent = vttContent.replace(/ position:0%/g, "");
+
+          // Write cleaned VTT to destination
+          fs.writeFileSync(destSubPath, vttContent, "utf-8");
+
+          // Remove original file
+          fs.unlinkSync(sourceSubPath);
+
+          console.log(
+            `Processed and moved subtitle ${subtitleFile} to ${destSubPath}`
+          );
+
+          subtitles.push({
+            language,
+            filename: destSubFilename,
+            path: `/subtitles/${destSubFilename}`,
+          });
         }
-
-        // Get file size
-        try {
-            if (fs.existsSync(finalVideoPath)) {
-                const stats = fs.statSync(finalVideoPath);
-                videoData.fileSize = stats.size.toString();
-            }
-        } catch (e) {
-            console.error("Failed to get file size:", e);
-        }
-
-        // Save the video
-        storageService.saveVideo(videoData);
-
-        console.log("Video added to database");
-
-        return videoData;
+      } catch (subtitleError) {
+        console.error("Error processing subtitle files:", subtitleError);
+      }
+    } catch (error) {
+      console.error("Error in download process:", error);
+      throw error;
     }
+
+    // Create metadata for the video
+    const videoData: Video = {
+      id: timestamp.toString(),
+      title: videoTitle || "Video",
+      author: videoAuthor || "Unknown",
+      description: videoDescription,
+      date:
+        videoDate || new Date().toISOString().slice(0, 10).replace(/-/g, ""),
+      source: source, // Use extracted source
+      sourceUrl: videoUrl,
+      videoFilename: finalVideoFilename,
+      thumbnailFilename: thumbnailSaved ? finalThumbnailFilename : undefined,
+      thumbnailUrl: thumbnailUrl || undefined,
+      videoPath: `/videos/${finalVideoFilename}`,
+      thumbnailPath: thumbnailSaved
+        ? `/images/${finalThumbnailFilename}`
+        : null,
+      subtitles: subtitles.length > 0 ? subtitles : undefined,
+      duration: undefined, // Will be populated below
+      addedAt: new Date().toISOString(),
+      createdAt: new Date().toISOString(),
+    };
+
+    // If duration is missing from info, try to extract it from file
+    const finalVideoPath = path.join(VIDEOS_DIR, finalVideoFilename);
+
+    try {
+      const { getVideoDuration } = await import(
+        "../../services/metadataService"
+      );
+      const duration = await getVideoDuration(finalVideoPath);
+      if (duration) {
+        videoData.duration = duration.toString();
+      }
+    } catch (e) {
+      console.error("Failed to extract duration from downloaded file:", e);
+    }
+
+    // Get file size
+    try {
+      if (fs.existsSync(finalVideoPath)) {
+        const stats = fs.statSync(finalVideoPath);
+        videoData.fileSize = stats.size.toString();
+      }
+    } catch (e) {
+      console.error("Failed to get file size:", e);
+    }
+
+    // Save the video
+    storageService.saveVideo(videoData);
+
+    console.log("Video added to database");
+
+    return videoData;
+  }
 }
diff --git a/build-and-push.sh b/build-and-push.sh
index ee5ed70..79a31f0 100755
--- a/build-and-push.sh
+++ b/build-and-push.sh
@@ -5,8 +5,8 @@ DOCKER_PATH="/Applications/Docker.app/Contents/Resources/bin/docker"
 USERNAME="franklioxygen"
 VERSION=$1
 
-BACKEND_LATEST="$USERNAME/mytube:backend-latest"
-FRONTEND_LATEST="$USERNAME/mytube:frontend-latest"
+BACKEND_LATEST="$USERNAME/mytube:backend-test"
+FRONTEND_LATEST="$USERNAME/mytube:frontend-test"
 
 if [ -n "$VERSION" ]; then
   echo "🔖 Version specified: $VERSION"