feat: add AniList character dictionary sync

2026-04-10 16:19:24 -07:00 · 2026-03-05 22:43:19 -08:00
parent 2f07c3407a
commit 33ded3c1bf
117 changed files with 3579 additions and 6443 deletions
--- a/src/main/character-dictionary-runtime.ts
+++ b/src/main/character-dictionary-runtime.ts
@@ -0,0 +1,955 @@
+import * as fs from 'fs';
+import * as os from 'os';
+import * as path from 'path';
+import type { AnilistMediaGuess } from '../core/services/anilist/anilist-updater';
+
+const ANILIST_GRAPHQL_URL = 'https://graphql.anilist.co';
+const HONORIFIC_SUFFIXES = [
+  'さん',
+  '様',
+  '先生',
+  '先輩',
+  '後輩',
+  '氏',
+  '君',
+  'くん',
+  'ちゃん',
+  'たん',
+  '坊',
+  '殿',
+  '博士',
+  '社長',
+  '部長',
+] as const;
+const VIDEO_EXTENSIONS = new Set([
+  '.mkv',
+  '.mp4',
+  '.avi',
+  '.webm',
+  '.mov',
+  '.flv',
+  '.wmv',
+  '.m4v',
+  '.ts',
+  '.m2ts',
+]);
+
+type CharacterDictionaryRole = 'main' | 'primary' | 'side' | 'appears';
+
+type CharacterDictionaryCacheEntry = {
+  mediaId: number;
+  mediaTitle: string;
+  entryCount: number;
+  zipPath: string;
+  updatedAt: number;
+  formatVersion?: number;
+  dictionaryTitle?: string;
+  revision?: string;
+};
+
+type CharacterDictionaryCacheFile = {
+  anilistById: Record<string, CharacterDictionaryCacheEntry>;
+};
+
+const CHARACTER_DICTIONARY_FORMAT_VERSION = 8;
+
+type AniListSearchResponse = {
+  Page?: {
+    media?: Array<{
+      id: number;
+      episodes?: number | null;
+      title?: {
+        romaji?: string | null;
+        english?: string | null;
+        native?: string | null;
+      };
+    }>;
+  };
+};
+
+type AniListCharacterPageResponse = {
+  Media?: {
+    title?: {
+      romaji?: string | null;
+      english?: string | null;
+      native?: string | null;
+    };
+    characters?: {
+      pageInfo?: {
+        hasNextPage?: boolean | null;
+      };
+      edges?: Array<{
+        role?: string | null;
+        node?: {
+          id: number;
+          description?: string | null;
+          image?: {
+            large?: string | null;
+            medium?: string | null;
+          } | null;
+          name?: {
+            full?: string | null;
+            native?: string | null;
+          } | null;
+        } | null;
+      } | null>;
+    } | null;
+  } | null;
+};
+
+type CharacterRecord = {
+  id: number;
+  role: CharacterDictionaryRole;
+  fullName: string;
+  nativeName: string;
+  description: string;
+  imageUrl: string | null;
+};
+
+type ZipEntry = {
+  name: string;
+  data: Buffer;
+  crc32: number;
+  localHeaderOffset: number;
+};
+
+export type CharacterDictionaryBuildResult = {
+  zipPath: string;
+  fromCache: boolean;
+  mediaId: number;
+  mediaTitle: string;
+  entryCount: number;
+  dictionaryTitle?: string;
+  revision?: string;
+};
+
+export type CharacterDictionaryGenerateOptions = {
+  refreshTtlMs?: number;
+};
+
+export interface CharacterDictionaryRuntimeDeps {
+  userDataPath: string;
+  getCurrentMediaPath: () => string | null;
+  getCurrentMediaTitle: () => string | null;
+  resolveMediaPathForJimaku: (mediaPath: string | null) => string | null;
+  guessAnilistMediaInfo: (
+    mediaPath: string | null,
+    mediaTitle: string | null,
+  ) => Promise<AnilistMediaGuess | null>;
+  now: () => number;
+  logInfo?: (message: string) => void;
+  logWarn?: (message: string) => void;
+}
+
+type ResolvedAniListMedia = {
+  id: number;
+  title: string;
+};
+
+function sleep(ms: number): Promise<void> {
+  return new Promise((resolve) => setTimeout(resolve, ms));
+}
+
+function normalizeTitle(value: string): string {
+  return value.trim().toLowerCase().replace(/\s+/g, ' ');
+}
+
+function pickAniListSearchResult(
+  title: string,
+  episode: number | null,
+  media: Array<{
+    id: number;
+    episodes?: number | null;
+    title?: {
+      romaji?: string | null;
+      english?: string | null;
+      native?: string | null;
+    };
+  }>,
+): ResolvedAniListMedia | null {
+  if (media.length === 0) return null;
+
+  const episodeFiltered =
+    typeof episode === 'number' && episode > 0
+      ? media.filter((entry) => entry.episodes == null || entry.episodes >= episode)
+      : media;
+  const candidates = episodeFiltered.length > 0 ? episodeFiltered : media;
+  const normalizedInput = normalizeTitle(title);
+  const exact = candidates.find((entry) => {
+    const candidateTitles = [entry.title?.romaji, entry.title?.english, entry.title?.native]
+      .filter((value): value is string => typeof value === 'string' && value.trim().length > 0)
+      .map((value) => normalizeTitle(value));
+    return candidateTitles.includes(normalizedInput);
+  });
+  const selected = exact ?? candidates[0]!;
+  const selectedTitle =
+    selected.title?.english?.trim() ||
+    selected.title?.romaji?.trim() ||
+    selected.title?.native?.trim() ||
+    title;
+  return {
+    id: selected.id,
+    title: selectedTitle,
+  };
+}
+
+function hasKanaOnly(value: string): boolean {
+  return /^[\u3040-\u309f\u30a0-\u30ffー]+$/.test(value);
+}
+
+function katakanaToHiragana(value: string): string {
+  let output = '';
+  for (const char of value) {
+    const code = char.charCodeAt(0);
+    if (code >= 0x30a1 && code <= 0x30f6) {
+      output += String.fromCharCode(code - 0x60);
+      continue;
+    }
+    output += char;
+  }
+  return output;
+}
+
+function buildReading(term: string): string {
+  const compact = term.replace(/\s+/g, '').trim();
+  if (!compact || !hasKanaOnly(compact)) {
+    return '';
+  }
+  return katakanaToHiragana(compact);
+}
+
+function buildNameTerms(character: CharacterRecord): string[] {
+  const base = new Set<string>();
+  const rawNames = [character.nativeName, character.fullName];
+  for (const rawName of rawNames) {
+    const name = rawName.trim();
+    if (!name) continue;
+    base.add(name);
+
+    const compact = name.replace(/[\s\u3000]+/g, '');
+    if (compact && compact !== name) {
+      base.add(compact);
+    }
+
+    const noMiddleDots = compact.replace(/[・･·•]/g, '');
+    if (noMiddleDots && noMiddleDots !== compact) {
+      base.add(noMiddleDots);
+    }
+
+    const split = name.split(/[\s\u3000]+/).filter((part) => part.trim().length > 0);
+    if (split.length === 2) {
+      base.add(split[0]!);
+      base.add(split[1]!);
+    }
+
+    const splitByMiddleDot = name
+      .split(/[・･·•]/)
+      .map((part) => part.trim())
+      .filter((part) => part.length > 0);
+    if (splitByMiddleDot.length >= 2) {
+      for (const part of splitByMiddleDot) {
+        base.add(part);
+      }
+    }
+  }
+
+  const withHonorifics = new Set<string>();
+  for (const entry of base) {
+    withHonorifics.add(entry);
+    for (const suffix of HONORIFIC_SUFFIXES) {
+      withHonorifics.add(`${entry}${suffix}`);
+    }
+  }
+
+  return [...withHonorifics].filter((entry) => entry.trim().length > 0);
+}
+
+function stripDescription(value: string): string {
+  return value.replace(/<[^>]+>/g, ' ').replace(/\s+/g, ' ').trim();
+}
+
+function normalizeDescription(value: string): string {
+  const stripped = stripDescription(value);
+  if (!stripped) return '';
+  return stripped
+    .replace(/\[([^\]]+)\]\((https?:\/\/[^)\s]+)\)/g, '$1')
+    .replace(/https?:\/\/\S+/g, '')
+    .replace(/__([^_]+)__/g, '$1')
+    .replace(/\*\*([^*]+)\*\*/g, '$1')
+    .replace(/~!/g, '')
+    .replace(/!~/g, '')
+    .replace(/\s+/g, ' ')
+    .trim();
+}
+
+function roleInfo(role: CharacterDictionaryRole): { tag: string; score: number } {
+  if (role === 'main') return { tag: 'main', score: 100 };
+  if (role === 'primary') return { tag: 'primary', score: 75 };
+  if (role === 'side') return { tag: 'side', score: 50 };
+  return { tag: 'appears', score: 25 };
+}
+
+function mapRole(input: string | null | undefined): CharacterDictionaryRole {
+  const value = (input || '').trim().toUpperCase();
+  if (value === 'MAIN') return 'main';
+  if (value === 'BACKGROUND') return 'appears';
+  if (value === 'SUPPORTING') return 'side';
+  return 'primary';
+}
+
+function roleLabel(role: CharacterDictionaryRole): string {
+  if (role === 'main') return 'Main';
+  if (role === 'primary') return 'Primary';
+  if (role === 'side') return 'Side';
+  return 'Appears';
+}
+
+function inferImageExt(contentType: string | null): string {
+  const normalized = (contentType || '').toLowerCase();
+  if (normalized.includes('png')) return 'png';
+  if (normalized.includes('gif')) return 'gif';
+  if (normalized.includes('webp')) return 'webp';
+  return 'jpg';
+}
+
+function ensureDir(dirPath: string): void {
+  if (fs.existsSync(dirPath)) return;
+  fs.mkdirSync(dirPath, { recursive: true });
+}
+
+function expandUserPath(input: string): string {
+  if (input.startsWith('~')) {
+    return path.join(os.homedir(), input.slice(1));
+  }
+  return input;
+}
+
+function isVideoFile(filePath: string): boolean {
+  const ext = path.extname(filePath).toLowerCase();
+  return VIDEO_EXTENSIONS.has(ext);
+}
+
+function findFirstVideoFileInDirectory(directoryPath: string): string | null {
+  const queue: string[] = [directoryPath];
+  while (queue.length > 0) {
+    const current = queue.shift()!;
+    let entries: fs.Dirent[] = [];
+    try {
+      entries = fs.readdirSync(current, { withFileTypes: true });
+    } catch {
+      continue;
+    }
+    entries.sort((a, b) => a.name.localeCompare(b.name));
+    for (const entry of entries) {
+      const fullPath = path.join(current, entry.name);
+      if (entry.isFile() && isVideoFile(fullPath)) {
+        return fullPath;
+      }
+      if (entry.isDirectory() && !entry.name.startsWith('.')) {
+        queue.push(fullPath);
+      }
+    }
+  }
+  return null;
+}
+
+function resolveDictionaryGuessInputs(targetPath: string): {
+  mediaPath: string;
+  mediaTitle: string | null;
+} {
+  const trimmed = targetPath.trim();
+  if (!trimmed) {
+    throw new Error('Dictionary target path is empty.');
+  }
+  const resolvedPath = path.resolve(expandUserPath(trimmed));
+  let stats: fs.Stats;
+  try {
+    stats = fs.statSync(resolvedPath);
+  } catch {
+    throw new Error(`Dictionary target path not found: ${targetPath}`);
+  }
+
+  if (stats.isFile()) {
+    return {
+      mediaPath: resolvedPath,
+      mediaTitle: path.basename(resolvedPath),
+    };
+  }
+
+  if (stats.isDirectory()) {
+    const firstVideo = findFirstVideoFileInDirectory(resolvedPath);
+    if (firstVideo) {
+      return {
+        mediaPath: firstVideo,
+        mediaTitle: path.basename(firstVideo),
+      };
+    }
+    return {
+      mediaPath: resolvedPath,
+      mediaTitle: path.basename(resolvedPath),
+    };
+  }
+
+  throw new Error(`Dictionary target must be a file or directory path: ${targetPath}`);
+}
+
+function readCache(cachePath: string): CharacterDictionaryCacheFile {
+  try {
+    const raw = fs.readFileSync(cachePath, 'utf8');
+    const parsed = JSON.parse(raw) as CharacterDictionaryCacheFile;
+    if (!parsed || typeof parsed !== 'object' || !parsed.anilistById) {
+      return { anilistById: {} };
+    }
+    return parsed;
+  } catch {
+    return { anilistById: {} };
+  }
+}
+
+function writeCache(cachePath: string, cache: CharacterDictionaryCacheFile): void {
+  ensureDir(path.dirname(cachePath));
+  fs.writeFileSync(cachePath, JSON.stringify(cache, null, 2), 'utf8');
+}
+
+function createDefinitionGlossary(
+  character: CharacterRecord,
+  mediaTitle: string,
+  imagePath: string | null,
+): Array<string | Record<string, unknown>> {
+  const displayName = character.nativeName || character.fullName || `Character ${character.id}`;
+  const lines: string[] = [`${displayName} [${roleLabel(character.role)}]`, `${mediaTitle} · AniList`];
+
+  const description = normalizeDescription(character.description);
+  if (description) {
+    lines.push(description);
+  }
+
+  if (!imagePath) {
+    return [lines.join('\n')];
+  }
+
+  const content: Array<string | Record<string, unknown>> = [
+    {
+      tag: 'img',
+      path: imagePath,
+      width: 8,
+      height: 11,
+      sizeUnits: 'em',
+      title: displayName,
+      alt: displayName,
+      description: `${displayName} · ${mediaTitle}`,
+      collapsed: false,
+      collapsible: false,
+      background: true,
+    },
+  ];
+
+  for (let i = 0; i < lines.length; i += 1) {
+    if (i > 0) {
+      content.push({ tag: 'br' });
+    }
+    content.push(lines[i]!);
+  }
+
+  return [
+    {
+      type: 'structured-content',
+      content,
+    },
+  ];
+}
+
+function buildTermEntry(
+  term: string,
+  reading: string,
+  role: CharacterDictionaryRole,
+  glossary: Array<string | Record<string, unknown>>,
+): Array<string | number | Array<string | Record<string, unknown>>> {
+  const { tag, score } = roleInfo(role);
+  return [term, reading, `name ${tag}`, '', score, glossary, 0, ''];
+}
+
+const CRC32_TABLE = (() => {
+  const table = new Uint32Array(256);
+  for (let i = 0; i < 256; i += 1) {
+    let crc = i;
+    for (let j = 0; j < 8; j += 1) {
+      crc = (crc & 1) !== 0 ? 0xedb88320 ^ (crc >>> 1) : crc >>> 1;
+    }
+    table[i] = crc >>> 0;
+  }
+  return table;
+})();
+
+function crc32(data: Buffer): number {
+  let crc = 0xffffffff;
+  for (const byte of data) {
+    crc = CRC32_TABLE[(crc ^ byte) & 0xff]! ^ (crc >>> 8);
+  }
+  return (crc ^ 0xffffffff) >>> 0;
+}
+
+function createStoredZip(files: Array<{ name: string; data: Buffer }>): Buffer {
+  const chunks: Buffer[] = [];
+  const entries: ZipEntry[] = [];
+  let offset = 0;
+
+  for (const file of files) {
+    const fileName = Buffer.from(file.name, 'utf8');
+    const fileData = file.data;
+    const fileCrc32 = crc32(fileData);
+    const local = Buffer.alloc(30 + fileName.length);
+    let cursor = 0;
+    local.writeUInt32LE(0x04034b50, cursor);
+    cursor += 4;
+    local.writeUInt16LE(20, cursor);
+    cursor += 2;
+    local.writeUInt16LE(0, cursor);
+    cursor += 2;
+    local.writeUInt16LE(0, cursor);
+    cursor += 2;
+    local.writeUInt16LE(0, cursor);
+    cursor += 2;
+    local.writeUInt16LE(0, cursor);
+    cursor += 2;
+    local.writeUInt32LE(fileCrc32, cursor);
+    cursor += 4;
+    local.writeUInt32LE(fileData.length, cursor);
+    cursor += 4;
+    local.writeUInt32LE(fileData.length, cursor);
+    cursor += 4;
+    local.writeUInt16LE(fileName.length, cursor);
+    cursor += 2;
+    local.writeUInt16LE(0, cursor);
+    cursor += 2;
+    fileName.copy(local, cursor);
+
+    chunks.push(local, fileData);
+    entries.push({
+      name: file.name,
+      data: fileData,
+      crc32: fileCrc32,
+      localHeaderOffset: offset,
+    });
+    offset += local.length + fileData.length;
+  }
+
+  const centralStart = offset;
+  const centralChunks: Buffer[] = [];
+  for (const entry of entries) {
+    const fileName = Buffer.from(entry.name, 'utf8');
+    const central = Buffer.alloc(46 + fileName.length);
+    let cursor = 0;
+    central.writeUInt32LE(0x02014b50, cursor);
+    cursor += 4;
+    central.writeUInt16LE(20, cursor);
+    cursor += 2;
+    central.writeUInt16LE(20, cursor);
+    cursor += 2;
+    central.writeUInt16LE(0, cursor);
+    cursor += 2;
+    central.writeUInt16LE(0, cursor);
+    cursor += 2;
+    central.writeUInt16LE(0, cursor);
+    cursor += 2;
+    central.writeUInt16LE(0, cursor);
+    cursor += 2;
+    central.writeUInt32LE(entry.crc32, cursor);
+    cursor += 4;
+    central.writeUInt32LE(entry.data.length, cursor);
+    cursor += 4;
+    central.writeUInt32LE(entry.data.length, cursor);
+    cursor += 4;
+    central.writeUInt16LE(fileName.length, cursor);
+    cursor += 2;
+    central.writeUInt16LE(0, cursor);
+    cursor += 2;
+    central.writeUInt16LE(0, cursor);
+    cursor += 2;
+    central.writeUInt16LE(0, cursor);
+    cursor += 2;
+    central.writeUInt16LE(0, cursor);
+    cursor += 2;
+    central.writeUInt32LE(0, cursor);
+    cursor += 4;
+    central.writeUInt32LE(entry.localHeaderOffset, cursor);
+    cursor += 4;
+    fileName.copy(central, cursor);
+    centralChunks.push(central);
+    offset += central.length;
+  }
+
+  const centralSize = offset - centralStart;
+  const end = Buffer.alloc(22);
+  let cursor = 0;
+  end.writeUInt32LE(0x06054b50, cursor);
+  cursor += 4;
+  end.writeUInt16LE(0, cursor);
+  cursor += 2;
+  end.writeUInt16LE(0, cursor);
+  cursor += 2;
+  end.writeUInt16LE(entries.length, cursor);
+  cursor += 2;
+  end.writeUInt16LE(entries.length, cursor);
+  cursor += 2;
+  end.writeUInt32LE(centralSize, cursor);
+  cursor += 4;
+  end.writeUInt32LE(centralStart, cursor);
+  cursor += 4;
+  end.writeUInt16LE(0, cursor);
+
+  return Buffer.concat([...chunks, ...centralChunks, end]);
+}
+
+async function fetchAniList<T>(
+  query: string,
+  variables: Record<string, unknown>,
+): Promise<T> {
+  const response = await fetch(ANILIST_GRAPHQL_URL, {
+    method: 'POST',
+    headers: {
+      'Content-Type': 'application/json',
+    },
+    body: JSON.stringify({
+      query,
+      variables,
+    }),
+  });
+  if (!response.ok) {
+    throw new Error(`AniList request failed (${response.status})`);
+  }
+  const payload = (await response.json()) as {
+    data?: T;
+    errors?: Array<{ message?: string }>;
+  };
+  const firstError = payload.errors?.find((entry) => entry && typeof entry.message === 'string');
+  if (firstError?.message) {
+    throw new Error(firstError.message);
+  }
+  if (!payload.data) {
+    throw new Error('AniList response missing data');
+  }
+  return payload.data;
+}
+
+async function resolveAniListMediaIdFromGuess(
+  guess: AnilistMediaGuess,
+): Promise<ResolvedAniListMedia> {
+  const data = await fetchAniList<AniListSearchResponse>(
+    `
+      query($search: String!) {
+        Page(perPage: 10) {
+          media(search: $search, type: ANIME, sort: [SEARCH_MATCH, POPULARITY_DESC]) {
+            id
+            episodes
+            title {
+              romaji
+              english
+              native
+            }
+          }
+        }
+      }
+    `,
+    {
+      search: guess.title,
+    },
+  );
+
+  const media = data.Page?.media ?? [];
+  const resolved = pickAniListSearchResult(guess.title, guess.episode, media);
+  if (!resolved) {
+    throw new Error(`No AniList media match found for "${guess.title}".`);
+  }
+  return resolved;
+}
+
+async function fetchCharactersForMedia(mediaId: number): Promise<{
+  mediaTitle: string;
+  characters: CharacterRecord[];
+}> {
+  const characters: CharacterRecord[] = [];
+  let page = 1;
+  let mediaTitle = '';
+  for (;;) {
+    const data = await fetchAniList<AniListCharacterPageResponse>(
+      `
+        query($id: Int!, $page: Int!) {
+          Media(id: $id, type: ANIME) {
+            title {
+              romaji
+              english
+              native
+            }
+            characters(page: $page, perPage: 50, sort: [ROLE, RELEVANCE, ID]) {
+              pageInfo {
+                hasNextPage
+              }
+              edges {
+                role
+                node {
+                  id
+                  description(asHtml: false)
+                  image {
+                    large
+                    medium
+                  }
+                  name {
+                    full
+                    native
+                  }
+                }
+              }
+            }
+          }
+        }
+      `,
+      {
+        id: mediaId,
+        page,
+      },
+    );
+
+    const media = data.Media;
+    if (!media) {
+      throw new Error(`AniList media ${mediaId} not found.`);
+    }
+    if (!mediaTitle) {
+      mediaTitle =
+        media.title?.english?.trim() ||
+        media.title?.romaji?.trim() ||
+        media.title?.native?.trim() ||
+        `AniList ${mediaId}`;
+    }
+
+    const edges = media.characters?.edges ?? [];
+    for (const edge of edges) {
+      const node = edge?.node;
+      if (!node || typeof node.id !== 'number') continue;
+      const fullName = node.name?.full?.trim() || '';
+      const nativeName = node.name?.native?.trim() || '';
+      if (!fullName && !nativeName) continue;
+      characters.push({
+        id: node.id,
+        role: mapRole(edge?.role),
+        fullName,
+        nativeName,
+        description: node.description || '',
+        imageUrl: node.image?.large || node.image?.medium || null,
+      });
+    }
+
+    const hasNextPage = Boolean(media.characters?.pageInfo?.hasNextPage);
+    if (!hasNextPage) {
+      break;
+    }
+    page += 1;
+    await sleep(300);
+  }
+
+  return {
+    mediaTitle,
+    characters,
+  };
+}
+
+async function downloadCharacterImage(imageUrl: string, charId: number): Promise<{
+  filename: string;
+  bytes: Buffer;
+} | null> {
+  try {
+    const response = await fetch(imageUrl);
+    if (!response.ok) return null;
+    const bytes = Buffer.from(await response.arrayBuffer());
+    if (bytes.length === 0) return null;
+    const ext = inferImageExt(response.headers.get('content-type'));
+    return {
+      filename: `c${charId}.${ext}`,
+      bytes,
+    };
+  } catch {
+    return null;
+  }
+}
+
+function buildDictionaryTitle(mediaId: number): string {
+  return `SubMiner Character Dictionary (AniList ${mediaId})`;
+}
+
+function createIndex(mediaId: number, mediaTitle: string, revision: string): Record<string, unknown> {
+  const dictionaryTitle = buildDictionaryTitle(mediaId);
+  return {
+    title: dictionaryTitle,
+    revision,
+    format: 3,
+    author: 'SubMiner',
+    description: `Character names from ${mediaTitle} [AniList media ID ${mediaId}]`,
+  };
+}
+
+function createTagBank(): Array<[string, string, number, string, number]> {
+  return [
+    ['name', 'partOfSpeech', 0, 'Character name', 0],
+    ['main', 'name', 0, 'Protagonist', 0],
+    ['primary', 'name', 0, 'Main character', 0],
+    ['side', 'name', 0, 'Side character', 0],
+    ['appears', 'name', 0, 'Minor appearance', 0],
+  ];
+}
+
+export function createCharacterDictionaryRuntimeService(deps: CharacterDictionaryRuntimeDeps): {
+  generateForCurrentMedia: (
+    targetPath?: string,
+    options?: CharacterDictionaryGenerateOptions,
+  ) => Promise<CharacterDictionaryBuildResult>;
+} {
+  const outputDir = path.join(deps.userDataPath, 'character-dictionaries');
+  const cachePath = path.join(outputDir, 'cache.json');
+
+  return {
+    generateForCurrentMedia: async (
+      targetPath?: string,
+      options?: CharacterDictionaryGenerateOptions,
+    ) => {
+      const dictionaryTarget = targetPath?.trim() || '';
+      const guessInput =
+        dictionaryTarget.length > 0
+          ? resolveDictionaryGuessInputs(dictionaryTarget)
+          : {
+              mediaPath: deps.getCurrentMediaPath(),
+              mediaTitle: deps.getCurrentMediaTitle(),
+            };
+      const mediaPathForGuess = deps.resolveMediaPathForJimaku(guessInput.mediaPath);
+      const mediaTitle = guessInput.mediaTitle;
+      const guessed = await deps.guessAnilistMediaInfo(mediaPathForGuess, mediaTitle);
+      if (!guessed || !guessed.title.trim()) {
+        throw new Error('Unable to resolve current anime from media path/title.');
+      }
+
+      const resolvedMedia = await resolveAniListMediaIdFromGuess(guessed);
+      const cache = readCache(cachePath);
+      const cached = cache.anilistById[String(resolvedMedia.id)];
+      const refreshTtlMsRaw = options?.refreshTtlMs;
+      const hasRefreshTtl =
+        typeof refreshTtlMsRaw === 'number' && Number.isFinite(refreshTtlMsRaw) && refreshTtlMsRaw > 0;
+      const now = deps.now();
+      const cacheAgeMs =
+        cached && typeof cached.updatedAt === 'number' && Number.isFinite(cached.updatedAt)
+          ? Math.max(0, now - cached.updatedAt)
+          : Number.POSITIVE_INFINITY;
+      const isCacheFresh = !hasRefreshTtl || cacheAgeMs <= refreshTtlMsRaw;
+      const isCacheFormatCurrent =
+        cached?.formatVersion === undefined
+          ? false
+          : cached.formatVersion >= CHARACTER_DICTIONARY_FORMAT_VERSION;
+      if (cached?.zipPath && fs.existsSync(cached.zipPath) && isCacheFresh && isCacheFormatCurrent) {
+        deps.logInfo?.(
+          `[dictionary] cache hit for AniList ${resolvedMedia.id}: ${path.basename(cached.zipPath)}`,
+        );
+        return {
+          zipPath: cached.zipPath,
+          fromCache: true,
+          mediaId: cached.mediaId,
+          mediaTitle: cached.mediaTitle,
+          entryCount: cached.entryCount,
+          dictionaryTitle: cached.dictionaryTitle ?? buildDictionaryTitle(cached.mediaId),
+          revision: cached.revision,
+        };
+      }
+
+      const { mediaTitle: fetchedMediaTitle, characters } = await fetchCharactersForMedia(
+        resolvedMedia.id,
+      );
+      if (characters.length === 0) {
+        throw new Error(`No characters returned for AniList media ${resolvedMedia.id}.`);
+      }
+
+      ensureDir(outputDir);
+      const zipFiles: Array<{ name: string; data: Buffer }> = [];
+      const termEntries: Array<Array<string | number | Array<string | Record<string, unknown>>>> =
+        [];
+      const seen = new Set<string>();
+
+      for (const character of characters) {
+        let imagePath: string | null = null;
+        if (character.imageUrl) {
+          const image = await downloadCharacterImage(character.imageUrl, character.id);
+          if (image) {
+            imagePath = `img/${image.filename}`;
+            zipFiles.push({
+              name: imagePath,
+              data: image.bytes,
+            });
+          }
+        }
+        const glossary = createDefinitionGlossary(character, fetchedMediaTitle, imagePath);
+        const candidateTerms = buildNameTerms(character);
+        for (const term of candidateTerms) {
+          const reading = buildReading(term);
+          const dedupeKey = `${term}|${reading}|${character.role}`;
+          if (seen.has(dedupeKey)) continue;
+          seen.add(dedupeKey);
+          termEntries.push(buildTermEntry(term, reading, character.role, glossary));
+        }
+      }
+
+      if (termEntries.length === 0) {
+        throw new Error('No dictionary entries generated from AniList character data.');
+      }
+
+      const revision = String(now);
+      const dictionaryTitle = buildDictionaryTitle(resolvedMedia.id);
+      zipFiles.push({
+        name: 'index.json',
+        data: Buffer.from(
+          JSON.stringify(createIndex(resolvedMedia.id, fetchedMediaTitle, revision), null, 2),
+          'utf8',
+        ),
+      });
+      zipFiles.push({
+        name: 'tag_bank_1.json',
+        data: Buffer.from(JSON.stringify(createTagBank()), 'utf8'),
+      });
+
+      const entriesPerBank = 10_000;
+      for (let i = 0; i < termEntries.length; i += entriesPerBank) {
+        const chunk = termEntries.slice(i, i + entriesPerBank);
+        zipFiles.push({
+          name: `term_bank_${Math.floor(i / entriesPerBank) + 1}.json`,
+          data: Buffer.from(JSON.stringify(chunk), 'utf8'),
+        });
+      }
+
+      const zipBuffer = createStoredZip(zipFiles);
+      const zipPath = path.join(outputDir, `anilist-${resolvedMedia.id}.zip`);
+      fs.writeFileSync(zipPath, zipBuffer);
+
+      const cacheEntry: CharacterDictionaryCacheEntry = {
+        mediaId: resolvedMedia.id,
+        mediaTitle: fetchedMediaTitle,
+        entryCount: termEntries.length,
+        zipPath,
+        updatedAt: now,
+        formatVersion: CHARACTER_DICTIONARY_FORMAT_VERSION,
+        dictionaryTitle,
+        revision,
+      };
+      cache.anilistById[String(resolvedMedia.id)] = cacheEntry;
+      writeCache(cachePath, cache);
+
+      deps.logInfo?.(
+        `[dictionary] generated AniList ${resolvedMedia.id}: ${termEntries.length} terms -> ${zipPath}`,
+      );
+
+      return {
+        zipPath,
+        fromCache: false,
+        mediaId: resolvedMedia.id,
+        mediaTitle: fetchedMediaTitle,
+        entryCount: termEntries.length,
+        dictionaryTitle,
+        revision,
+      };
+    },
+  };
+}