add "captions" as download format

2026-03-18 14:33:50 +00:00 · 2026-02-21 19:06:49 +02:00
parent e24890fd9b
commit 973a87ffc6
4 changed files with 48 additions and 4 deletions
--- a/README.md
+++ b/README.md
@@ -59,6 +59,7 @@ Certain values can be set via environment variables, using the `-e` parameter on
 * __OUTPUT_TEMPLATE_CHANNEL__: The template for the filenames of the downloaded videos when downloaded as a channel. Defaults to `%(channel)s/%(title)s.%(ext)s`. When empty, then `OUTPUT_TEMPLATE` is used.
 * __YTDL_OPTIONS__: Additional options to pass to yt-dlp in JSON format. [See available options here](https://github.com/yt-dlp/yt-dlp/blob/master/yt_dlp/YoutubeDL.py#L222). They roughly correspond to command-line options, though some do not have exact equivalents here. For example, `--recode-video` has to be specified via `postprocessors`. Also note that dashes are replaced with underscores. You may find [this script](https://github.com/yt-dlp/yt-dlp/blob/master/devscripts/cli_to_api.py) helpful for converting from command-line options to `YTDL_OPTIONS`.
 * __YTDL_OPTIONS_FILE__: A path to a JSON file that will be loaded and used for populating `YTDL_OPTIONS` above. Please note that if both `YTDL_OPTIONS_FILE` and `YTDL_OPTIONS` are specified, the options in `YTDL_OPTIONS` take precedence. The file will be monitored for changes and reloaded automatically when changes are detected.
+* UI format __Captions (EN, VTT)__: Downloads subtitles/captions only (no media) by applying yt-dlp options equivalent to `--skip-download --write-subs --write-auto-subs --sub-langs en --sub-format vtt`.

 ### 🌐 Web Server & URLs

--- a/app/dl_formats.py
+++ b/app/dl_formats.py
@@ -26,6 +26,10 @@ def get_format(format: str, quality: str) -> str:
        # Quality is irrelevant in this case since we skip the download
        return "bestaudio/best"

+    if format == "captions":
+        # Quality is irrelevant in this case since we skip the download
+        return "bestaudio/best"
+
    if format in AUDIO_FORMATS:
        # Audio quality needs to be set post-download, set in opts
        return f"bestaudio[ext={format}]/bestaudio/best"
@@ -98,6 +102,13 @@ def get_opts(format: str, quality: str, ytdl_opts: dict) -> dict:
            {"key": "FFmpegThumbnailsConvertor", "format": "jpg", "when": "before_dl"}
        )

+    if format == "captions":
+        opts["skip_download"] = True
+        opts["writesubtitles"] = True
+        opts["writeautomaticsub"] = True
+        opts["subtitleslangs"] = ["en"]
+        opts["subtitlesformat"] = "vtt"
+
    opts["postprocessors"] = postprocessors + (
        opts["postprocessors"] if "postprocessors" in opts else []
    )
--- a/app/ytdl.py
+++ b/app/ytdl.py
@@ -160,6 +160,14 @@ class Download:
                    else:
                        filename = filepath
                    self.status_queue.put({'status': 'finished', 'filename': filename})
+                    # For captions-only downloads, yt-dlp may still report a media-like
+                    # filepath in MoveFiles. Capture subtitle outputs explicitly so the
+                    # UI can link to real caption files.
+                    if self.info.format == 'captions':
+                        requested_subtitles = d.get('info_dict', {}).get('requested_subtitles', {}) or {}
+                        for subtitle in requested_subtitles.values():
+                            if isinstance(subtitle, dict) and subtitle.get('filepath'):
+                                self.status_queue.put({'subtitle_file': subtitle['filepath']})

                # Capture all chapter files when SplitChapters finishes
                elif d.get('postprocessor') == 'SplitChapters' and d.get('status') == 'finished':
@@ -260,10 +268,14 @@ class Download:
            self.tmpfilename = status.get('tmpfilename')
            if 'filename' in status:
                fileName = status.get('filename')
-                self.info.filename = os.path.relpath(fileName, self.download_dir)
-                self.info.size = os.path.getsize(fileName) if os.path.exists(fileName) else None
-                if self.info.format == 'thumbnail':
-                    self.info.filename = re.sub(r'\.webm$', '.jpg', self.info.filename)
+                rel_name = os.path.relpath(fileName, self.download_dir)
+                # For captions mode, ignore media-like placeholders and let subtitle_file
+                # statuses define the final file shown in the UI.
+                if not (self.info.format == 'captions' and not rel_name.endswith(('.vtt', '.srt', '.ass', '.ttml'))):
+                    self.info.filename = rel_name
+                    self.info.size = os.path.getsize(fileName) if os.path.exists(fileName) else None
+                    if self.info.format == 'thumbnail':
+                        self.info.filename = re.sub(r'\.webm$', '.jpg', self.info.filename)

            # Handle chapter files
            log.debug(f"Update status for {self.info.title}: {status}")
@@ -280,6 +292,21 @@ class Download:
                # Skip the rest of status processing for chapter files
                continue

+            if 'subtitle_file' in status:
+                subtitle_file = status.get('subtitle_file')
+                if not hasattr(self.info, 'subtitle_files'):
+                    self.info.subtitle_files = []
+                rel_path = os.path.relpath(subtitle_file, self.download_dir)
+                file_size = os.path.getsize(subtitle_file) if os.path.exists(subtitle_file) else None
+                existing = next((sf for sf in self.info.subtitle_files if sf['filename'] == rel_path), None)
+                if not existing:
+                    self.info.subtitle_files.append({'filename': rel_path, 'size': file_size})
+                # Prefer first subtitle file as the primary result link in captions mode.
+                if self.info.format == 'captions' and (not getattr(self.info, 'filename', None)):
+                    self.info.filename = rel_path
+                    self.info.size = file_size
+                continue
+
            self.info.status = status['status']
            self.info.msg = status.get('msg')
            if 'downloaded_bytes' in status:
--- a/ui/src/app/interfaces/formats.ts
+++ b/ui/src/app/interfaces/formats.ts
@@ -73,4 +73,9 @@ export const Formats: Format[] = [
    text: 'Thumbnail',
    qualities: [{ id: 'best', text: 'Best' }],
  },
+  {
+    id: 'captions',
+    text: 'Captions (EN, VTT)',
+    qualities: [{ id: 'best', text: 'Best' }],
+  },
 ];