Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
2 changes: 2 additions & 0 deletions CHANGELOG.md
Original file line number Diff line number Diff line change
Expand Up @@ -6,6 +6,8 @@

- Slides: support `--slides` for local video files in the main CLI and `summarize slides`, route local videos through the shared slide-aware flow, and document the local-file workflow (#149, thanks @steipete).

- Config: allow setting a default summary length via `output.length`, and keep prompt-override runs aligned with the configured length/language defaults in both CLI and daemon flows (#178, thanks @maciej).

### Fixes

- YouTube: detect obviously truncated caption-track transcripts on long videos and fall through to yt-dlp transcription instead of caching a broken partial result (#184, thanks @sportiz91).
Expand Down
4 changes: 4 additions & 0 deletions README.md
Original file line number Diff line number Diff line change
Expand Up @@ -211,6 +211,8 @@ summarize "https://open.spotify.com/episode/5auotqWAXhhKyb9ymCuBJY"

`--length` controls how much output we ask for (guideline), not a hard cap.

Set a default in `~/.summarize/config.json` with `output.length`.

```bash
summarize "https://example.com" --length long
summarize "https://example.com" --length 20k
Expand Down Expand Up @@ -512,6 +514,7 @@ Supported keys today:
{
"model": { "id": "openai/gpt-5-mini" },
"env": { "OPENAI_API_KEY": "sk-..." },
"output": { "length": "long" },
"ui": { "theme": "ember" }
}
```
Expand All @@ -531,6 +534,7 @@ Also supported:
- `models` (define presets selectable via `--model <preset>`)
- `env` (generic env var defaults; process env still wins)
- `apiKeys` (legacy shortcut, mapped to env names; prefer `env` for new configs)
- `output.length` (default `--length`: `short|medium|long|xl|xxl|20k`)
- `cache.media` (media download cache: TTL 7 days, 2048 MB cap by default; `--no-media-cache` disables)
- `media.videoMode: "auto"|"transcript"|"understand"`
- `slides.enabled` / `slides.max` / `slides.ocr` / `slides.dir` (defaults for `--slides`)
Expand Down
14 changes: 13 additions & 1 deletion docs/config.md
Original file line number Diff line number Diff line change
Expand Up @@ -29,6 +29,12 @@ For output language:
2. Config file `output.language` (preferred) or `language` (legacy)
3. Built-in default (`auto` = match source content language)

For output length:

1. CLI flag `--length`
2. Config file `output.length`
3. Built-in default (`xl`)

See `docs/language.md` for supported values.

For prompt:
Expand Down Expand Up @@ -58,12 +64,18 @@ For UI theme:
{
"model": { "id": "google/gemini-3-flash" },
"env": { "OPENAI_API_KEY": "sk-..." },
"output": { "language": "auto" },
"output": { "language": "auto", "length": "long" },
"prompt": "Explain like I am five.",
"ui": { "theme": "ember" }
}
```

`output.length` accepts the same values as `--length`:

- Presets: `short`, `medium`, `long`, `xl`, `xxl`
- Shorthand: `s`, `m`, `l`
- Character targets: `1500`, `20k`, `20000`

Shorthand (equivalent):

```json
Expand Down
3 changes: 2 additions & 1 deletion docs/llm.md
Original file line number Diff line number Diff line change
Expand Up @@ -73,7 +73,8 @@ installed, auto mode can use local CLI models via `cli.enabled` or implicit auto
- `--length short|medium|long|xl|xxl|<chars>`
- This is _soft guidance_ to the model (no hard truncation).
- Minimum numeric value: 50 chars.
- Default: `long`.
- Built-in default: `xl`.
- Config default: `output.length` in `~/.summarize/config.json`.
- Output format is Markdown; use short paragraphs and only add bullets when they improve scannability.
- `--force-summary`
- Always run the LLM even when extracted content is shorter than the requested length.
Expand Down
26 changes: 25 additions & 1 deletion src/config/sections.ts
Original file line number Diff line number Diff line change
@@ -1,3 +1,4 @@
import { parseLengthArg } from "../flags.js";
import { isCliThemeName, listCliThemes } from "../tty/theme.js";
import {
isRecord,
Expand Down Expand Up @@ -364,7 +365,30 @@ export function parseOutputConfig(root: Record<string, unknown>, path: string) {
typeof value.language === "string" && value.language.trim().length > 0
? value.language.trim()
: undefined;
return typeof language === "string" ? { language } : undefined;
const length = (() => {
if (typeof value.length === "undefined") return undefined;
if (typeof value.length !== "string") {
throw new Error(`Invalid config file ${path}: "output.length" must be a string.`);
}
const trimmed = value.length.trim();
if (!trimmed) {
throw new Error(`Invalid config file ${path}: "output.length" must not be empty.`);
}
try {
parseLengthArg(trimmed);
} catch (error) {
throw new Error(
`Invalid config file ${path}: "output.length" is invalid: ${(error as Error).message}`,
);
}
return trimmed;
})();
return typeof language === "string" || typeof length === "string"
? {
...(typeof language === "string" ? { language } : {}),
...(typeof length === "string" ? { length } : {}),
}
: undefined;
}

export function parseUiConfig(root: Record<string, unknown>, path: string) {
Expand Down
6 changes: 6 additions & 0 deletions src/config/types.ts
Original file line number Diff line number Diff line change
Expand Up @@ -213,6 +213,12 @@ export type SummarizeConfig = {
* - otherwise: translate the output into the requested language
*/
language?: string;
/**
* Default summary length (same values as `--length`).
*
* Examples: "short", "long", "xl", "20k".
*/
length?: string;
};
ui?: {
/**
Expand Down
14 changes: 4 additions & 10 deletions src/daemon/flow-context.ts
Original file line number Diff line number Diff line change
Expand Up @@ -20,6 +20,7 @@ import { createRunMetrics } from "../run/run-metrics.js";
import { resolveModelSelection } from "../run/run-models.js";
import { resolveDesiredOutputTokens } from "../run/run-output.js";
import {
buildPromptLengthInstruction,
type RunOverrides,
resolveOutputLanguageSetting,
resolveSummaryLength,
Expand Down Expand Up @@ -133,7 +134,6 @@ export function createDaemonUrlFlowContext(args: DaemonUrlFlowContextArgs): UrlF

const languageExplicitlySet = typeof languageRaw === "string" && Boolean(languageRaw.trim());

const { lengthArg } = resolveSummaryLength(lengthRaw);
const resolvedOverrides: RunOverrides = overrides ?? {
firecrawlMode: null,
markdownMode: null,
Expand Down Expand Up @@ -200,6 +200,7 @@ export function createDaemonUrlFlowContext(args: DaemonUrlFlowContextArgs): UrlF
});
const configForCliWithMagic = applyAutoCliFallbackOverrides(configForCli, resolvedOverrides);
const allowAutoCliFallback = resolvedOverrides.autoCliFallbackEnabled === true;
const { lengthArg } = resolveSummaryLength(lengthRaw, config?.output?.length ?? "xl");

const {
requestedModel,
Expand Down Expand Up @@ -279,16 +280,9 @@ export function createDaemonUrlFlowContext(args: DaemonUrlFlowContextArgs): UrlF
fallback: outputLanguageFromConfig,
});

const lengthInstruction =
promptOverride && lengthArg.kind === "chars"
? `Output is ${lengthArg.maxCharacters.toLocaleString()} characters.`
: null;
const languageExplicit =
typeof languageRaw === "string" &&
languageRaw.trim().length > 0 &&
languageRaw.trim().toLowerCase() !== "auto";
const lengthInstruction = promptOverride ? buildPromptLengthInstruction(lengthArg) : null;
const languageInstruction =
promptOverride && languageExplicit && outputLanguage.kind === "fixed"
promptOverride && outputLanguage.kind === "fixed"
? `Output should be ${outputLanguage.label}.`
: null;

Expand Down
2 changes: 1 addition & 1 deletion src/run/help.ts
Original file line number Diff line number Diff line change
Expand Up @@ -79,7 +79,7 @@ export function buildProgram() {
)
.option(
"--length <length>",
"Summary length: short|medium|long|xl|xxl (or s/m/l) or a character limit like 20000, 20k",
"Summary length: short|medium|long|xl|xxl (or s/m/l) or a character limit like 20000, 20k (default: xl; configurable via ~/.summarize/config.json output.length)",
"xl",
)
.option(
Expand Down
8 changes: 7 additions & 1 deletion src/run/run-settings.ts
Original file line number Diff line number Diff line change
Expand Up @@ -20,7 +20,7 @@ import {
} from "../flags.js";
import type { OutputLanguage } from "../language.js";
import { resolveOutputLanguage } from "../language.js";
import type { SummaryLengthTarget } from "../prompts/index.js";
import { formatPresetLengthGuidance, type SummaryLengthTarget } from "../prompts/index.js";
import {
parseCliProvider,
parseOptionalBoolean,
Expand Down Expand Up @@ -90,6 +90,12 @@ export function resolveSummaryLength(
return { lengthArg, summaryLength };
}

/**
 * Turn the resolved length setting into a length instruction for prompt-override runs.
 *
 * Character targets produce an explicit "Output is N characters." sentence;
 * preset lengths delegate to the shared preset guidance formatter.
 */
export function buildPromptLengthInstruction(lengthArg: LengthArg): string {
  if (lengthArg.kind === "chars") {
    return `Output is ${lengthArg.maxCharacters.toLocaleString()} characters.`;
  }
  return formatPresetLengthGuidance(lengthArg.preset);
}

export function resolveOutputLanguageSetting({
raw,
fallback,
Expand Down
13 changes: 7 additions & 6 deletions src/run/runner-plan.ts
Original file line number Diff line number Diff line change
Expand Up @@ -18,6 +18,7 @@ import { resolveRunInput } from "./run-input.js";
import { createRunMetrics } from "./run-metrics.js";
import { resolveModelSelection } from "./run-models.js";
import { resolveDesiredOutputTokens } from "./run-output.js";
import { buildPromptLengthInstruction, resolveSummaryLength } from "./run-settings.js";
import { resolveStreamSettings } from "./run-stream.js";
import { createRunnerFlowContexts } from "./runner-contexts.js";
import { executeRunnerInput } from "./runner-execution.js";
Expand Down Expand Up @@ -87,7 +88,7 @@ export async function createRunnerPlan(options: {
isYoutubeUrl,
format,
youtubeMode,
lengthArg,
lengthArg: requestedLengthArg,
maxOutputTokensArg,
timeoutMs,
retries,
Expand Down Expand Up @@ -176,6 +177,9 @@ export async function createRunnerPlan(options: {
if (!promptOverride && typeof config?.prompt === "string" && config.prompt.trim().length > 0) {
promptOverride = config.prompt.trim();
}
const lengthArg = lengthExplicitlySet
? requestedLengthArg
: resolveSummaryLength(config?.output?.length).lengthArg;

const slidesSettings = resolveRunnerSlidesSettings({
normalizedArgv,
Expand All @@ -185,12 +189,9 @@ export async function createRunnerPlan(options: {
});
const transcriptTimestamps = Boolean(programOpts.timestamps) || Boolean(slidesSettings);

const lengthInstruction =
promptOverride && lengthExplicitlySet && lengthArg.kind === "chars"
? `Output is ${lengthArg.maxCharacters.toLocaleString()} characters.`
: null;
const lengthInstruction = promptOverride ? buildPromptLengthInstruction(lengthArg) : null;
const languageInstruction =
promptOverride && languageExplicitlySet && outputLanguage.kind === "fixed"
promptOverride && outputLanguage.kind === "fixed"
? `Output should be ${outputLanguage.label}.`
: null;

Expand Down
84 changes: 81 additions & 3 deletions tests/cli.config-precedence.test.ts
Original file line number Diff line number Diff line change
Expand Up @@ -52,6 +52,12 @@ function captureStream() {
return { stream, getText: () => text };
}

/** Normalize any `fetch` input (string, `URL`, or request-like object) to its URL string. */
function resolveFetchUrl(input: RequestInfo | URL): string {
  if (typeof input === "string") return input;
  return input instanceof URL ? input.toString() : input.url;
}

describe("cli config precedence", () => {
it("uses config file model when --model and SUMMARIZE_MODEL are absent", async () => {
mocks.completeSimple.mockClear();
Expand All @@ -61,7 +67,7 @@ describe("cli config precedence", () => {
"<body><article><p>Hi</p></article></body></html>";

const fetchMock = vi.fn(async (input: RequestInfo | URL) => {
const url = typeof input === "string" ? input : input.url;
const url = resolveFetchUrl(input);
if (url === "https://example.com") return htmlResponse(html);
throw new Error(`Unexpected fetch call: ${url}`);
});
Expand Down Expand Up @@ -89,7 +95,7 @@ describe("cli config precedence", () => {
"<body><article><p>Hi</p></article></body></html>";

const fetchMock = vi.fn(async (input: RequestInfo | URL) => {
const url = typeof input === "string" ? input : input.url;
const url = resolveFetchUrl(input);
if (url === "https://example.com") return htmlResponse(html);
throw new Error(`Unexpected fetch call: ${url}`);
});
Expand Down Expand Up @@ -138,7 +144,7 @@ describe("cli config precedence", () => {
"<body><article><p>Hi</p></article></body></html>";

const fetchMock = vi.fn(async (input: RequestInfo | URL) => {
const url = typeof input === "string" ? input : input.url;
const url = resolveFetchUrl(input);
if (url === "https://example.com") return htmlResponse(html);
throw new Error(`Unexpected fetch call: ${url}`);
});
Expand Down Expand Up @@ -170,4 +176,76 @@ describe("cli config precedence", () => {
// --extract means no LLM calls; ensure we didn't try to init a provider.
expect(mocks.completeSimple).toHaveBeenCalledTimes(0);
});

it("uses config file output.length when --length is absent", async () => {
  mocks.completeSimple.mockClear();

  const pageHtml =
    "<!doctype html><html><head><title>Hello</title></head>" +
    "<body><article><p>Hi</p></article></body></html>";

  // Serve the fixture page for the one expected URL; any other fetch is a test bug.
  const mockedFetch = vi.fn(async (input: RequestInfo | URL) => {
    const target = resolveFetchUrl(input);
    if (target !== "https://example.com") {
      throw new Error(`Unexpected fetch call: ${target}`);
    }
    return htmlResponse(pageHtml);
  });

  // Fake $HOME carrying a config with a default length; no --length flag is passed.
  const home = mkdtempSync(join(tmpdir(), "summarize-cli-config-"));
  const configDir = join(home, ".summarize");
  mkdirSync(configDir, { recursive: true });
  writeFileSync(
    join(configDir, "config.json"),
    JSON.stringify({ model: { id: "openai/gpt-5.2" }, output: { length: "short" } }),
    "utf8",
  );

  const stdout = captureStream();

  await runCli(["--timeout", "2s", "--json", "https://example.com"], {
    env: { HOME: home, OPENAI_API_KEY: "test" },
    fetch: mockedFetch as unknown as typeof fetch,
    stdout: stdout.stream,
    stderr: noopStream(),
  });

  // The config's "short" preset should flow through to the resolved input length.
  const parsed = JSON.parse(stdout.getText()) as { input: { length: { preset: string } } };
  expect(parsed.input.length).toEqual({ kind: "preset", preset: "short" });
});

it("prefers --length over config file output.length", async () => {
  mocks.completeSimple.mockClear();

  const pageHtml =
    "<!doctype html><html><head><title>Hello</title></head>" +
    "<body><article><p>Hi</p></article></body></html>";

  // Serve the fixture page for the one expected URL; any other fetch is a test bug.
  const mockedFetch = vi.fn(async (input: RequestInfo | URL) => {
    const target = resolveFetchUrl(input);
    if (target !== "https://example.com") {
      throw new Error(`Unexpected fetch call: ${target}`);
    }
    return htmlResponse(pageHtml);
  });

  // Fake $HOME whose config requests "short" — the explicit CLI flag must win.
  const home = mkdtempSync(join(tmpdir(), "summarize-cli-config-"));
  const configDir = join(home, ".summarize");
  mkdirSync(configDir, { recursive: true });
  writeFileSync(
    join(configDir, "config.json"),
    JSON.stringify({ model: { id: "openai/gpt-5.2" }, output: { length: "short" } }),
    "utf8",
  );

  const stdout = captureStream();

  await runCli(["--timeout", "2s", "--length", "20k", "--json", "https://example.com"], {
    env: { HOME: home, OPENAI_API_KEY: "test" },
    fetch: mockedFetch as unknown as typeof fetch,
    stdout: stdout.stream,
    stderr: noopStream(),
  });

  // --length 20k overrides the config's preset and resolves to a character target.
  const parsed = JSON.parse(stdout.getText()) as {
    input: { length: { kind: string; maxCharacters: number } };
  };
  expect(parsed.input.length).toEqual({ kind: "chars", maxCharacters: 20000 });
});
});
Loading