From e029e898e9cda6f838e12068480dab9cf9df10bc Mon Sep 17 00:00:00 2001
From: admin <admin@eswiig.com>
Date: Fri, 22 May 2026 21:39:09 +0200
Subject: [PATCH] Initial snapshot before step 10 package split

---
 .gitignore                                 |    7 +
 AGENTS.md                                  |   71 +
 CLAUDE.md                                  |    1 +
 CLAUDE.md.bak                              |   59 +
 README.md                                  |  233 ++
 TODO.md                                    |    9 +
 config.json                                |    5 +
 fixtures/README.md                         |   83 +
 fixtures/filename-extraction.json          |   24 +
 fixtures/query-extraction.json             |   22 +
 fixtures/run.py                            |   70 +
 fixtures/shared-normalization.json         |   17 +
 mockups/console-consolidation-claude.html  |  695 ++++++
 mockups/console-consolidation-options.html |  355 ++++
 rc-jav.py                                  | 2230 ++++++++++++++++++++
 tests/test_rules.py                        |   74 +
 16 files changed, 3955 insertions(+)
 create mode 100644 .gitignore
 create mode 100644 AGENTS.md
 create mode 100644 CLAUDE.md
 create mode 100644 CLAUDE.md.bak
 create mode 100644 README.md
 create mode 100644 TODO.md
 create mode 100644 config.json
 create mode 100644 fixtures/README.md
 create mode 100644 fixtures/filename-extraction.json
 create mode 100644 fixtures/query-extraction.json
 create mode 100644 fixtures/run.py
 create mode 100644 fixtures/shared-normalization.json
 create mode 100644 mockups/console-consolidation-claude.html
 create mode 100644 mockups/console-consolidation-options.html
 create mode 100644 rc-jav.py
 create mode 100644 tests/test_rules.py

diff --git a/.gitignore b/.gitignore
new file mode 100644
index 0000000..432eb49
--- /dev/null
+++ b/.gitignore
@@ -0,0 +1,7 @@
+__pycache__/
+*.pyc
+scan-cancel.flag
+cache.json
+cache.json.tmp
+reports/
+.claude/
diff --git a/AGENTS.md b/AGENTS.md
new file mode 100644
index 0000000..dd71142
--- /dev/null
+++ b/AGENTS.md
@@ -0,0 +1,71 @@
+# rc-jav (Python CLI)
+
+Session memory for Codex. Read before making changes here.
+
+## What this is
+
+A read-only rclone library comparison + search CLI. Compares `cq:JAV` remote (rclone crypt) against itself (dupe detection) or against external WinCatalog CSV/XML exports. Powers the rclone-jav Brave extension via native messaging.
+
+## Architecture
+
+```
+rc-jav.py
+  ├── reads config.json (default_target etc.)
+  ├── reads cache.json (per-remote file index, written by --scan)
+  ├── shells out to: rclone lsf / rclone lsjson / rclone size --json
+  ├── extract_id() per filename → normalized ID with optional #partN / variant suffix
+  ├── two query modes: --quick (live rclone --include glob) and cached (uses cache.json)
+  └── output: rich tables (default) | --basic plain | --format json (for extension)
+```
+
+## Files
+
+```
+D:\DEV\Project\rclone-jav\
+├── rc-jav.py             single-file CLI
+├── config.json           default_source/target/catalog (user-editable via --save)
+├── cache.json            scanned remote file index (written by --scan)
+├── wincatalog\           drop WinCatalog CSV/XML exports here (auto-loaded)
+├── TODO.md               deferred work
+└── README.md
+```
+
+## Companion project
+
+`D:\DEV\Extensions\Production\rclone-jav\` (PC 1) / `D:\DEV\Extensions\Staging\rclone-jav\` (PC 2) — Brave extension + native messaging host that shells out to `rc-jav.py` for searches.
+
+## ID normalization
+
+- `extract_id()` chops trailing single letters (e.g. `IBW-902z.mp4` → `IBW-902`). Decision is intentional — see extension's AGENTS.md "Decision log".
+- JAV IDs are canonicalized with at least 3 digits (`ABC-27` → `ABC-027`); 4+ digit IDs keep their width (`ABCD-1294`). User expects real JAV IDs to be `ABC-027`, never `ABC-27` or `ABC-0027`.
+- Part suffix detection: `_1`, `-pt1`, `(1)` → appended as `#partN` for distinctness.
+- Compound prefixes (`FC2-PPV-123`) handled via secondary regex.
+- Search matcher does prefix lookup so `IBW-902` finds both `IBW-902` and `IBW-902#part1` etc.
+- Quick search must emit only canonical padded uppercase globs (`ABC-027*`, `ABCDE-1167*`). Do not add `--ignore-case`; user never uses lowercase filenames and it caused noticeable delay.
+
+## Defaults from earlier sessions
+
+- `cq:JAV` is the current remote root (after the rclone crypt config change moved it down a level)
+- `default_target` in config.json = `["cq:JAV"]`
+- `human_size()` formats to 2 decimals (e.g. `6.94 GiB`)
+- After the 3-digit ID canonicalization change, run `python rc-jav.py --scan` to rebuild `cache.json` under the new padded keys.
+- Duplicate KEEP ranking uses configurable VIP folders before source/size/format ranking. Default VIP folder is `ClearJAV`; video files there are treated as the trusted direct-rip copy.
+- Duplicate KEEP ranking treats `.ts` as the lowest-priority video container when any non-`.ts` duplicate is available.
+
+## Recent decisions / bug fixes
+
+- `--format json` should keep stdout as clean JSON. Status/progress text belongs on stderr in JSON mode.
+- Catalog rows are informational. CSV exports mark them as `CATALOG`; JSON exports put them under `catalog`, not `delete_candidates`.
+- Cache loading validates the top-level shape and falls back to an empty cache when `remotes` is missing or malformed.
+- The old `--recursive/-R` flag was removed because scans are always recursive (`rclone lsf -R` / quick `lsjson -R`).
+
+## TODO
+
+See `TODO.md` for deferred work.
+
+## When making changes
+
+- Adding CLI flags: also update host invocation in `D:\DEV\Extensions\Production\rclone-jav\host\rcjav-host.py` if the flag matters to the extension
+- Changing `extract_id()` semantics: forces a `--scan` to rebuild cache under new keys, and may need a parallel change in extension's `normalizeId()`
+- JSON output format changes: extension's popup.js / overlay rendering reads `structured` array — keep field names stable (`source`, `remote`, `path`, `full_path`, `size`, `size_human`, `mod_time`, `jav_id`)
+- Config schema: update `--save` writer and any defaults
diff --git a/CLAUDE.md b/CLAUDE.md
new file mode 100644
index 0000000..43c994c
--- /dev/null
+++ b/CLAUDE.md
@@ -0,0 +1 @@
+@AGENTS.md
diff --git a/CLAUDE.md.bak b/CLAUDE.md.bak
new file mode 100644
index 0000000..3b425fe
--- /dev/null
+++ b/CLAUDE.md.bak
@@ -0,0 +1,59 @@
+# rc-jav (Python CLI)
+
+Session memory for Claude. Read before making changes here.
+
+## What this is
+
+A read-only rclone library comparison + search CLI. Compares `cq:JAV` remote (rclone crypt) against itself (dupe detection) or against external WinCatalog CSV/XML exports. Powers the rclone-jav Brave extension via native messaging.
+
+## Architecture
+
+```
+rc-jav.py
+  ├── reads config.json (default_target etc.)
+  ├── reads cache.json (per-remote file index, written by --scan)
+  ├── shells out to: rclone lsf / rclone lsjson / rclone size --json
+  ├── extract_id() per filename → normalized ID with optional #partN / variant suffix
+  ├── two query modes: --quick (live rclone --include glob) and cached (uses cache.json)
+  └── output: rich tables (default) | --basic plain | --format json (for extension)
+```
+
+## Files
+
+```
+D:\DEV\Project\rclone-jav\
+├── rc-jav.py             single-file CLI
+├── config.json           default_source/target/catalog (user-editable via --save)
+├── cache.json            scanned remote file index (written by --scan)
+├── wincatalog\           drop WinCatalog CSV/XML exports here (auto-loaded)
+├── TODO.md               deferred work
+└── README.md
+```
+
+## Companion project
+
+`D:\DEV\Extensions\Production\rclone-jav\` (PC 1) / `D:\DEV\Extensions\Staging\rclone-jav\` (PC 2) — Brave extension + native messaging host that shells out to `rc-jav.py` for searches.
+
+## ID normalization
+
+- `extract_id()` chops trailing single letters (e.g. `IBW-902z.mp4` → `IBW-902`). Decision is intentional — see extension's CLAUDE.md "Decision log".
+- Part suffix detection: `_1`, `-pt1`, `(1)` → appended as `#partN` for distinctness.
+- Compound prefixes (`FC2-PPV-123`) handled via secondary regex.
+- Search matcher does prefix lookup so `IBW-902` finds both `IBW-902` and `IBW-902#part1` etc.
+
+## Defaults from earlier sessions
+
+- `cq:JAV` is the current remote root (after the rclone crypt config change moved it down a level)
+- `default_target` in config.json = `["cq:JAV"]`
+- `human_size()` formats to 2 decimals (e.g. `6.94 GiB`)
+
+## TODO
+
+See `TODO.md`. Current item: WinCatalog `\` → `/` path normalization in load_catalog_*.
+
+## When making changes
+
+- Adding CLI flags: also update host invocation in `D:\DEV\Extensions\Production\rclone-jav\host\rcjav-host.py` if the flag matters to the extension
+- Changing `extract_id()` semantics: forces a `--scan` to rebuild cache under new keys, and may need a parallel change in extension's `normalizeId()`
+- JSON output format changes: extension's popup.js / overlay rendering reads `structured` array — keep field names stable (`source`, `remote`, `path`, `full_path`, `size`, `size_human`, `mod_time`, `jav_id`)
+- Config schema: update `--save` writer and any defaults
diff --git a/README.md b/README.md
new file mode 100644
index 0000000..08a99d2
--- /dev/null
+++ b/README.md
@@ -0,0 +1,233 @@
+# rc-jav
+
+Read-only duplicate scanner for JAV files across rclone remotes. Groups files by JAV ID (e.g. `SSIS-001`) and reports which copy to keep based on priority rules.
+
+## Priority rules
+
+1. Video files inside configured **VIP folders** win first. Default VIP folder: `ClearJAV`.
+2. If no VIP-folder video exists, **Source always wins** regardless of resolution/size.
+3. `.ts` files rank below other video containers, even when the transport-stream copy is larger.
+4. If no Source copy exists in the group, **largest file size wins** among the remaining Targets.
+5. Suggestions only — script never deletes. Manual cleanup.
+
+## ID matching
+
+Filename stem is matched against:
+
+- Primary: `^([A-Za-z]+)-(\d+)` — `SSIS-001`, `MIDV-123`, `ABP-456`
+- Compound: `^(\w+(?:-\w+)+)-(\d+)` — `FC2-PPV-4894535`, `HEYZO-HD-1234`
+- Fallback: `^([A-Za-z0-9]+)-(\d+)` — `1pondo-123`, `carib-456`
+
+IDs normalized to uppercase with leading zeros stripped from the number (so `ssis-001` == `SSIS-1` == `SSIS-001`). Anything after the ID (` - Actress [1080p]`) is ignored for matching.
+
+### Part-suffix handling
+
+Multi-part files (`_1`, `_2`, `-1`, `-2`, `_A`, `_B`, `.1of4`, ` (1)`, `-pt1`, `-part1`, `-cd1`, `-disc1`, trailing ` N`) are normalized as `{ID}#partN` so they do not collide as false duplicates. Searching the base ID still finds all parts. Lettered `_A` / `_B` suffixes become part 1 / part 2.
+
+Add more suffix shapes with repeatable `--part-pattern` regexes. The first capture group is the part number or one part letter and the pattern runs against the filename stem:
+
+```powershell
+python rc-jav.py --scan --part-pattern '[-_ ]side[-_ ]?(A|B)$'
+python rc-jav.py --part-pattern '_([CD])$' --save
+```
+
+Saved rules live in `config.json` as `part_patterns`. The extension Options page has the same custom part detector list for host-triggered searches, duplicate review, and cache rebuilds.
+
+Files with no parseable ID are listed under "Skipped" at the end so you can spot misnamed files.
+
+### Rule checks
+
+Focused rule tests cover ID extraction, multipart grouping safety, and duplicate KEEP ranking:
+
+```powershell
+python -B -m unittest discover -s tests -v
+```
+
+## Usage
+
+```
+python rc-jav.py \
+  --source cq:personal-files/ClearJAV/ichika-matsumoto \
+  --target cq:personal-files/JAV/TMP \
+```
+
+Flags:
+- `--source` / `-s REMOTE` — priority remote path. Repeat for multiple.
+- `--target` / `-t REMOTE` — non-priority remote path. Repeat for multiple.
+- `--format {console,txt,csv,json,all}` — default `console`. Non-console formats write to `--output-dir`.
+- `--output-dir DIR` — default `./reports`.
+- `--no-color` — disable ANSI colors but keep rich layout (tables, panels).
+- `--basic` — plain text output, no rich tables/panels. Progress ticks every 25 files on stderr. Useful for piping or simple terminals.
+- `--rclone-bin PATH` — path to rclone executable (default: `rclone` on PATH). Example: `--rclone-bin C:\Programs\rclone\rclone.exe`.
+- `--clearjav` — shortcut: sets source = `DEFAULT_SOURCE`, target = `DEFAULT_TARGET`. Equivalent to `--source cq:personal-files/ClearJAV --target cq:personal-files/JAV/TMP`. Combine with `--source`/`--target` to override one side.
+
+Examples:
+
+```
+# full library dupe scan, one flag
+python rc-jav.py --clearjav
+
+# same but only check one actress folder against TMP
+python rc-jav.py --clearjav --source cq:personal-files/ClearJAV/ichika-matsumoto
+```
+
+## Search mode
+
+Check whether a JAV ID already exists in your library before downloading:
+
+```
+python rc-jav.py --search SSIS-001
+python rc-jav.py --search SSIS-001 --search FC2-PPV-4894535
+
+# wildcards (quote to avoid shell glob expansion)
+python rc-jav.py --search "IPZZ-*"
+python rc-jav.py --search "FC2-PPV-*"
+python rc-jav.py --search "SSIS-???"     # exact 3-digit numeric
+```
+
+Wildcard syntax: `*` (any chars) and `?` (one char), case-insensitive. Matches against normalized IDs in the index, including `#partN` suffixes automatically.
+
+Range syntax: `[N-M]` inclusive both ends. Works inside any prefix.
+
+```
+python rc-jav.py --search "IPZZ-[820-860]"
+python rc-jav.py --search "FC2-PPV-[4894500-4894600]"
+python rc-jav.py --search "MIDV-[001-010]"   # zero-padding preserved
+```
+
+Quote in PowerShell/bash so `[...]` reaches Python literally. Reversed ranges (`860-820`) auto-swap.
+
+With no `--source` / `--target` flags, only `DEFAULT_TARGET` (TMP) is scanned — the typical case for "do I already have this in my unsorted pile?". Pass `--source cq:personal-files/ClearJAV` to also check the priority library. Edit `DEFAULT_SOURCE` / `DEFAULT_TARGET` at the top of the script to change defaults. Remote scans are recursive.
+
+Exit code: `0` if every query had at least one hit, `1` otherwise — useful for shell automation.
+
+## Name search (`--name`)
+
+Substring search against filenames (case-insensitive). Find all files by actress, studio, tag, anything that appears in the filename.
+
+```
+python rc-jav.py --name Ichika
+python rc-jav.py --name "Ichika Matsumoto"
+python rc-jav.py --name Ichika --name Yui          # OR — files matching either
+python rc-jav.py --name "Mat*"                     # glob wildcard
+python rc-jav.py --search IPZZ-860 --name Ichika   # both — separate result blocks
+```
+
+- Multiple `--name` tokens = OR. Use one combined `--name "foo bar"` for AND/exact-substring.
+- Matches against the filename stem only (not folder names).
+- Auto-routes to **cached** mode because substring globs can't be server-side filtered on most backends. Pass `-q` to force quick anyway (slower).
+
+### Smart search mode (auto quick / cached)
+
+The script auto-picks the right execution path per query and prints which one it chose:
+
+| Query shape | Picked mode | Reason |
+|---|---|---|
+| Single exact ID (`IPZZ-860`) | quick | live rclone `--include`, ~1–2s even on huge trees |
+| Wildcard (`IPZZ-*`, `SSIS-???`) | cached | reliable normalized matching |
+| Range (`IPZZ-[820-860]`) | cached | avoids N rclone calls |
+| Multiple `--search` flags | cached | warmup amortizes |
+
+Override:
+- `--quick` / `-q` — force live rclone lookup (skips cache).
+- `--cache` — force cache (builds it if cold).
+
+Quick mode never reads or writes the cache. Cache mode honors `--update` and `--no-cache` as before.
+
+### Cache
+
+Search mode caches each remote's file list in `./cache.json` next to the script. Subsequent searches are near-instant.
+
+- First run: scans + writes cache.
+- Later runs: reads cache (banner shows `CACHED 14m (154 files)`).
+- `--update` / `-u`: force re-scan + overwrite cache for the requested remotes.
+- `--no-cache`: bypass cache (no read, no write).
+- Stale warning when cache is older than 24h — still used, marked `CACHED-STALE`.
+- Ctrl+C during a scan: rclone is terminated, cache for in-flight remote is NOT written.
+
+Delete `cache.json` to reset everything.
+
+### Saving defaults (--save)
+
+Persist `--source`, `--target`, `--catalog`, and/or `--part-pattern` to `config.json` so you don't have to type them every run.
+
+```
+# set default target
+python rc-jav.py --target cq:personal-files/JAV/TMP --save
+
+# set source + multiple targets at once
+python rc-jav.py --source cq:personal-files/ClearJAV ^
+                 --target cq:personal-files/JAV/TMP ^
+                 --target cq:personal-files/JAV/SORTED ^
+                 --save
+
+# inspect
+type config.json
+```
+
+Only the keys you explicitly pass are written — running `--save --target X` won't wipe a saved `default_source`. Delete `config.json` to reset to the hardcoded defaults at the top of `rc-jav.py`.
+
+### Scan-only (--scan)
+
+Refresh the cache without running a search or dupe report — useful for Task Scheduler / cron pre-warming.
+
+```
+# default: refresh DEFAULT_TARGET (TMP)
+python rc-jav.py --scan
+
+# refresh both source and target
+python rc-jav.py --scan --source cq:personal-files/ClearJAV --target cq:personal-files/JAV/TMP
+
+# nightly via Task Scheduler
+schtasks /Create /SC DAILY /ST 03:00 /TN "rc-jav nightly scan" ^
+  /TR "python D:\DEV\Project\rclone-jav\rc-jav.py --scan --basic"
+```
+
+`--scan` always overwrites the cache for the remotes you list. Exit 0 = success, non-zero = rclone failure.
+
+```
+python rc-jav.py --search MIDV-999 ; if ($LASTEXITCODE -eq 0) { "have it" } else { "download" }
+```
+
+## WinCatalog integration
+
+WinCatalog's native `.wcat` format is proprietary, so the script reads its exports instead.
+
+1. In WinCatalog: **File → Export** → choose **CSV** or **XML**.
+2. Save into the `wincatalog/` folder next to the script. All `*.csv` and `*.xml` files there are auto-loaded — drop in as many discs as you want.
+3. Run as normal: `python rc-jav.py --search IPZZ-860`
+4. Override or add extra paths with `--catalog PATH` (file or folder, repeatable).
+5. To change the default folder, edit `DEFAULT_CATALOG` at the top of the script.
+
+Re-export when your catalog changes; the script re-reads on every run (catalog data is **not** cached — it's already a local file).
+
+**Role of catalog hits:**
+- Search: shown as rows with source label `Catalog`. The disc/volume name is encoded into the path so you know which offline backup holds the file.
+- Dupe mode: catalog entries appear in groups for awareness but are **never marked KEEP or DELETE?** — they're offline, can't be touched. A group is only flagged as a dupe when 2+ rclone copies exist.
+
+**CSV column auto-detection** (case-insensitive, first match wins):
+- Name: `Name`, `File Name`, `Filename`, `Title`
+- Path: `Path`, `Full Path`, `Location`, `Folder`
+- Size: `Size`, `File Size`, `Bytes`, `Size (bytes)`
+- Disc: `Disc`, `Disc Name`, `Disc Label`, `Volume`, `Source`, `Catalog`, `Media`
+
+XML: walks the tree, treats `<File>` / `<f>` nodes inside `<Disc>` / `<Catalog>` / `<Volume>` containers, with `<Folder>` nesting.
+
+## Requirements
+
+- Python 3.9+
+- `pip install rich` (used for progress bars + themed output)
+- `rclone` on `PATH` with the relevant remotes configured.
+
+## UI
+
+- Live per-file progress bar during scans (`rclone size --json` for total, then `rclone lsf --files-only -R --format pst` streamed).
+- Banner panel showing run mode + per-remote cache status.
+- Rich tables for search hits and duplicate groups.
+- `--no-color` for plain output (CI, piping).
+
+## Roadmap
+
+- Phase 1 (current): report duplicates + search.
+- Phase 2: `--apply` mode that runs `rclone delete` on `DELETE?` candidates behind a confirmation gate.
+- Phase 3: resolution-aware tiebreakers, move-to-review folder, scheduled runs.
diff --git a/TODO.md b/TODO.md
new file mode 100644
index 0000000..f831295
--- /dev/null
+++ b/TODO.md
@@ -0,0 +1,9 @@
+# TODO / Deferred work
+
+## Deferred
+
+(append below)
+
+## Completed notes
+
+- WinCatalog CSV/XML paths are normalized from `\` to `/` during catalog load.
diff --git a/config.json b/config.json
new file mode 100644
index 0000000..496030f
--- /dev/null
+++ b/config.json
@@ -0,0 +1,5 @@
+{
+  "default_target": [
+    "cq:JAV"
+  ]
+}
\ No newline at end of file
diff --git a/fixtures/README.md b/fixtures/README.md
new file mode 100644
index 0000000..2a00990
--- /dev/null
+++ b/fixtures/README.md
@@ -0,0 +1,83 @@
+# Shared JAV ID fixture corpus
+
+JSON cases shared between the Python `rc-jav.py` CLI and the browser
+extension at `D:\DEV\Extensions\Production\rclone-jav\`. Each side
+reads the cases relevant to its own extraction surface.
+
+## Files
+
+| File                          | Domain   | Consumer                               | Notes |
+|-------------------------------|----------|----------------------------------------|-------|
+| `filename-extraction.json`    | filename | Python `extract_id(name)`              | Has `#partN` expectations for multipart files |
+| `query-extraction.json`       | query    | Extension `content.js` `normalizeId`   | Looser context; extension never emits part suffix |
+| `shared-normalization.json`   | shared   | BOTH                                   | Contract: any mismatch here is a bug, not a fixture issue |
+
+All files share the same shape:
+
+```json
+{
+  "version": 1,
+  "domain": "…",
+  "description": "…",
+  "case_schema": { … },
+  "cases": [
+    { "name": "…", "input": "…", "expected": "…" }
+  ]
+}
+```
+
+`expected: null` means "no ID should be detected".
+
+## Running the Python side
+
+```bash
+python fixtures/run.py
+```
+
+The runner imports `rc-jav.py` in place, exercises `extract_id` against
+`filename-extraction.json`, and `normalize_id` against
+`shared-normalization.json`. Exit code is non-zero on any failure.
+
+## Running the extension side
+
+No automated runner today. `content.js` lives inside an IIFE that the
+browser injects into pages, so importing it from Node would require
+either an extraction refactor or a duplicated copy of the regex. Until
+that lands, treat `query-extraction.json` and `shared-normalization.json`
+as the canonical specification: if you touch `ID_RE_DASHED`,
+`ID_RE_UNDASHED`, or `BUILTIN_ID_NORMALIZERS` in content.js, eyeball
+this corpus and confirm the cases still describe expected behavior.
+
+## Adding a case
+
+1. Pick the file matching the surface you're testing.
+2. Append a `{ "name", "input", "expected" }` entry. Keep `name`
+   descriptive — it's the only label shown when the runner fails.
+3. If the case exercises a guarantee both sides must honor, add it to
+   `shared-normalization.json` as well.
+4. Run `python fixtures/run.py` to confirm Python still passes.
+
+## Known cross-side divergences (intentional)
+
+These are NOT bugs — they reflect the different surfaces each side
+extracts from. Recorded here so future contributors don't try to
+"fix" them.
+
+- **`FC2PPV1841460` compact form (no dashes).** The extension's
+  `BUILTIN_ID_NORMALIZERS` in `content.js` rewrites this to
+  `FC2-PPV-1841460` when seen in page titles. Python `extract_id`
+  does NOT — the compact form doesn't realistically appear in
+  filenames on disk. Hence the case lives in
+  `query-extraction.json` only, not in `filename-extraction.json` or
+  `shared-normalization.json`.
+
+If a case belongs to one side's contract but not the other's, file it
+under the specific domain (`filename-` or `query-`) — not under
+`shared-`.
+
+## Ownership
+
+This directory lives in the Python repo only because the Python repo
+is the more stable root. Conceptually it's joint property of both
+codebases. Don't add anything Python-specific to the JSON files — keep
+them tool-neutral.
diff --git a/fixtures/filename-extraction.json b/fixtures/filename-extraction.json
new file mode 100644
index 0000000..fc656b6
--- /dev/null
+++ b/fixtures/filename-extraction.json
@@ -0,0 +1,24 @@
+{
+  "version": 1,
+  "domain": "filename",
+  "description": "Filename → canonical JAV ID (with optional #partN suffix). Consumed by Python rc-jav.extract_id.",
+  "case_schema": {
+    "name": "human label",
+    "input": "filename including extension",
+    "expected": "canonical ID (e.g. ABC-001 or ABC-001#part1) or null when no ID present"
+  },
+  "cases": [
+    { "name": "plain dashed ID",                       "input": "ABC-027.mp4",                            "expected": "ABC-027" },
+    { "name": "dashed ID with resolution tag",         "input": "SCOP-297 [1080p].mp4",                   "expected": "SCOP-297" },
+    { "name": "bracket-wrapped ID",                    "input": "[REAL-779].mp4",                         "expected": "REAL-779" },
+    { "name": "bracket-wrapped ID with extra tag",     "input": "[SCOP-297] [1080p].mp4",                 "expected": "SCOP-297" },
+    { "name": "no-hyphen fallback",                    "input": "MVSD312.avi",                            "expected": "MVSD-312" },
+    { "name": "trailing lowercase variant letter",     "input": "IBW-902z.mp4",                           "expected": "IBW-902z" },
+    { "name": "multipart _PART suffix",                "input": "KV-118 - Aiba Reika_PART1.mp4",          "expected": "KV-118#part1" },
+    { "name": "multipart _A letter suffix",            "input": "KV-118_A.mp4",                           "expected": "KV-118#part1" },
+    { "name": "multipart trailing -N before bracket",  "input": "OFJE-195-7 [480p].mp4",                  "expected": "OFJE-195#part7" },
+    { "name": "FC2 PPV plain",                         "input": "FC2-1841460.mp4",                        "expected": "FC2-PPV-1841460" },
+    { "name": "FC2 PPV explicit",                      "input": "FC2-PPV-1841460.mp4",                    "expected": "FC2-PPV-1841460" },
+    { "name": "no ID present",                         "input": "random_video.mp4",                       "expected": null }
+  ]
+}
diff --git a/fixtures/query-extraction.json b/fixtures/query-extraction.json
new file mode 100644
index 0000000..25cdcce
--- /dev/null
+++ b/fixtures/query-extraction.json
@@ -0,0 +1,22 @@
+{
+  "version": 1,
+  "domain": "query",
+  "description": "Page text / title -> canonical JAV ID. Consumed by the browser extension (content.js normalizeId). Difference from filename: looser context (sentences, mixed punctuation, site chrome). Includes forms (e.g. FC2PPV compact) that Python extract_id does NOT handle, by design — see fixtures/README.md.",
+  "case_schema": {
+    "name": "human label",
+    "input": "raw page text",
+    "expected": "canonical ID without part suffix (extension never emits #partN), or null when no ID found"
+  },
+  "cases": [
+    { "name": "title with site chrome",                "input": "SSIS-001 — JAV.tube",                                     "expected": "SSIS-001" },
+    { "name": "title with description",                "input": "Watch SSIS-001 1080p HD Online",                          "expected": "SSIS-001" },
+    { "name": "trailing letter variant",               "input": "IBW-902z Full Movie",                                     "expected": "IBW-902" },
+    { "name": "no hyphen in title",                    "input": "MVSD312 stream",                                          "expected": "MVSD-312" },
+    { "name": "FC2 PPV compact",                       "input": "FC2PPV-1841460 — preview",                                "expected": "FC2-PPV-1841460" },
+    { "name": "FC2 plain digits",                      "input": "FC2-1841460 thumbnail",                                   "expected": "FC2-PPV-1841460" },
+    { "name": "FC2-PPV explicit",                      "input": "FC2-PPV-1841460 Full",                                    "expected": "FC2-PPV-1841460" },
+    { "name": "leading zeros preserved",               "input": "ABF-042 — sample",                                        "expected": "ABF-042" },
+    { "name": "long numeric tail (7 digits)",          "input": "BLK-4748520 stream",                                      "expected": "BLK-4748520" },
+    { "name": "no ID present",                         "input": "JAV Database · home",                                     "expected": null }
+  ]
+}
diff --git a/fixtures/run.py b/fixtures/run.py
new file mode 100644
index 0000000..3f97e68
--- /dev/null
+++ b/fixtures/run.py
@@ -0,0 +1,70 @@
+"""Run the shared JAV-ID fixture corpus against rc-jav.py.
+
+Exits non-zero if any fixture case fails. No third-party dependencies.
+
+Usage:
+    python fixtures/run.py
+"""
+from __future__ import annotations
+
+import importlib.util
+import json
+import sys
+from pathlib import Path
+
+ROOT = Path(__file__).resolve().parents[1]
+FIXTURES = Path(__file__).resolve().parent
+
+SPEC = importlib.util.spec_from_file_location("rcjav", ROOT / "rc-jav.py")
+RCJAV = importlib.util.module_from_spec(SPEC)
+sys.modules[SPEC.name] = RCJAV
+SPEC.loader.exec_module(RCJAV)
+
+
+def _load(name: str) -> dict:
+    with (FIXTURES / name).open("r", encoding="utf-8") as f:
+        return json.load(f)
+
+
+def _run(label: str, cases: list[dict], fn) -> tuple[int, int]:
+    passed = 0
+    failed = 0
+    for case in cases:
+        got = fn(case["input"])
+        if got == case["expected"]:
+            passed += 1
+        else:
+            failed += 1
+            print(f"  FAIL [{label}] {case['name']!r}")
+            print(f"        input    = {case['input']!r}")
+            print(f"        expected = {case['expected']!r}")
+            print(f"        got      = {got!r}")
+    return passed, failed
+
+
+def main() -> int:
+    total_passed = 0
+    total_failed = 0
+
+    for filename, fn_name, fn in [
+        ("filename-extraction.json", "extract_id", RCJAV.extract_id),
+        ("shared-normalization.json", "normalize_id", RCJAV.normalize_id),
+    ]:
+        doc = _load(filename)
+        cases = doc.get("cases", [])
+        print(f"\n{filename}  ->  rcjav.{fn_name}  ({len(cases)} cases)")
+        p, f = _run(filename, cases, fn)
+        total_passed += p
+        total_failed += f
+        print(f"  {p} passed | {f} failed")
+
+    print()
+    if total_failed:
+        print(f"FAILED: {total_failed} of {total_passed + total_failed} cases")
+        return 1
+    print(f"OK: all {total_passed} cases passed")
+    return 0
+
+
+if __name__ == "__main__":
+    sys.exit(main())
diff --git a/fixtures/shared-normalization.json b/fixtures/shared-normalization.json
new file mode 100644
index 0000000..7880f5b
--- /dev/null
+++ b/fixtures/shared-normalization.json
@@ -0,0 +1,17 @@
+{
+  "version": 1,
+  "domain": "shared",
+  "description": "Raw ID forms → canonical form. Both Python (normalize_id) and the extension (content.js normalizeId) MUST agree on these. Mismatch here is a contract bug.",
+  "case_schema": {
+    "name": "human label",
+    "input": "raw ID-bearing token (no path, no extension)",
+    "expected": "canonical ID"
+  },
+  "cases": [
+    { "name": "lowercase prefix uppercased",           "input": "abc-027",         "expected": "ABC-027" },
+    { "name": "FC2 plain -> FC2-PPV",                  "input": "FC2-1841460",     "expected": "FC2-PPV-1841460" },
+    { "name": "FC2-PPV explicit preserved",            "input": "FC2-PPV-1841460", "expected": "FC2-PPV-1841460" },
+    { "name": "leading zeros preserved",               "input": "ABF-042",         "expected": "ABF-042" },
+    { "name": "5-digit numeric segment",               "input": "SDDE-12345",      "expected": "SDDE-12345" }
+  ]
+}
diff --git a/mockups/console-consolidation-claude.html b/mockups/console-consolidation-claude.html
new file mode 100644
index 0000000..05ed4c8
--- /dev/null
+++ b/mockups/console-consolidation-claude.html
@@ -0,0 +1,695 @@
+<!doctype html>
+<html>
+<head>
+  <meta charset="utf-8">
+  <title>rclone-jav consolidation — final converged plan</title>
+  <style>
+    :root {
+      color-scheme: dark;
+      --bg: #0c0e10;
+      --shell: #14171a;
+      --panel: #181b1e;
+      --surface: #1f2327;
+      --line: #292e33;
+      --line-2: #3a4148;
+      --text: #e1e6eb;
+      --muted: #8a949d;
+      --blue: #6ec5ff;
+      --green: #7de4a0;
+      --yellow: #ffd36c;
+      --red: #ff9097;
+      --purple: #c5a9ff;
+      --orange: #ffb072;
+    }
+    * { box-sizing: border-box; }
+    body { margin:0; background:var(--bg); color:var(--text); font:13px/1.5 -apple-system,BlinkMacSystemFont,"Segoe UI",sans-serif; }
+    main { padding:24px; max-width:1380px; margin:0 auto; }
+    h1 { margin:0 0 4px; font-size:24px; }
+    h2 { margin:24px 0 8px; font-size:17px; color:#f4f7fa; }
+    h3 { margin:0 0 6px; font-size:11px; text-transform:uppercase; color:#9ba6af; letter-spacing:0.04em; }
+    p { margin:0; }
+    .intro { color:var(--muted); max-width:960px; margin:6px 0 18px; font-size:13px; }
+    .meta-banner { display:flex; align-items:center; gap:10px; padding:10px 14px; background:#11181f; border:1px solid #1f2b35; border-radius:6px; margin-bottom:18px; font-size:12px; color:var(--muted); }
+    .meta-banner .dot { width:8px; height:8px; border-radius:50%; background:var(--green); box-shadow:0 0 0 3px rgba(125,228,160,0.15); }
+    .meta-banner b { color:#cfdde5; }
+
+    .status-grid { display:grid; grid-template-columns:repeat(3,minmax(0,1fr)); gap:12px; margin-bottom:24px; }
+    .status-card { background:#13171b; border:1px solid #232a30; border-radius:6px; padding:12px; }
+    .status-card h3 { color:#dce5ed; text-transform:none; letter-spacing:0; font-size:13px; margin-bottom:8px; }
+    .status-card.done { border-left:3px solid var(--green); }
+    .status-card.todo { border-left:3px solid var(--yellow); }
+    .status-card.work { border-left:3px solid var(--blue); }
+    .status-card ul { margin:0; padding-left:16px; color:var(--muted); font-size:12px; }
+    .status-card ul li { margin:2px 0; }
+    .status-card ul li b { color:#dce5ed; font-weight:600; }
+
+    .legend { display:flex; gap:6px; flex-wrap:wrap; margin-bottom:14px; }
+    .pill { border-radius:12px; padding:3px 9px; font-size:11px; border:1px solid var(--line-2); background:#22272b; color:var(--text); }
+    .pill.keep { color:var(--green); background:#143020; border-color:#245036; }
+    .pill.move { color:var(--blue); background:#132837; border-color:#284b66; }
+    .pill.del  { color:var(--red); background:#321618; border-color:#5b2228; }
+    .pill.debug{ color:var(--purple); background:#241d35; border-color:#453363; }
+    .pill.warn { color:var(--yellow); background:#332b16; border-color:#645228; }
+    .pill.ctx  { color:var(--orange); background:#3a2818; border-color:#7a4b25; }
+
+    .mock { border:1px solid #2c333a; border-radius:8px; background:var(--shell); overflow:hidden; }
+    .top { display:flex; align-items:center; justify-content:space-between; padding:11px 14px; border-bottom:1px solid var(--line); background:#0f1214; }
+    .brand { font-weight:700; color:#fff; font-size:14px; letter-spacing:0.01em; }
+    .toolbar { display:flex; gap:6px; align-items:center; }
+    button { border:1px solid var(--line-2); border-radius:4px; padding:5px 10px; background:#252a2e; color:var(--text); font:inherit; cursor:default; }
+    button.primary { background:#163923; color:#aaf3bf; border-color:#285b3a; }
+    button.live { background:#143247; color:#9fd9ff; border-color:#2e607f; }
+    button.danger { background:#3a191d; color:#ffb2b7; border-color:#722c33; }
+    button.ghost { background:transparent; color:#9aa4ac; border-color:#3a4148; }
+
+    .layout { display:grid; grid-template-columns: 200px minmax(0,1fr); min-height:480px; }
+    .side { background:#0d1013; border-right:1px solid var(--line); padding:14px 12px; }
+    .grp { margin-bottom:16px; }
+    .gtitle { color:#5e6970; text-transform:uppercase; letter-spacing:0.06em; font-size:10px; margin:0 0 6px; padding-left:6px; }
+    .nav { display:grid; gap:2px; }
+    .nav a { display:flex; align-items:center; justify-content:space-between; padding:6px 8px; border-radius:4px; color:#b3bdc4; text-decoration:none; gap:6px; }
+    .nav a.active { background:#27313a; color:#fff; box-shadow:inset 2px 0 var(--blue); }
+    .nav a:hover:not(.active) { background:#1a1f24; }
+    .nav .badge { font-size:10px; padding:1px 6px; border-radius:9px; background:#2d343a; color:#a7b2bb; }
+    .nav .badge.warn { background:#3a3017; color:#ffd784; }
+    .nav .badge.fresh{ background:#1d3826; color:#9be3b3; }
+
+    .content { padding:18px 20px; min-width:0; }
+    .heading { display:flex; align-items:flex-start; justify-content:space-between; gap:10px; margin-bottom:14px; }
+    .heading .desc { color:var(--muted); font-size:12px; margin-top:3px; }
+    .row-actions { display:flex; gap:6px; }
+
+    .sub-tabs { display:flex; gap:0; border-bottom:1px solid var(--line); margin-bottom:14px; }
+    .sub-tabs span { padding:8px 14px; color:#8b95a0; font-size:12px; cursor:default; border-bottom:2px solid transparent; }
+    .sub-tabs span.active { color:#fff; border-bottom-color: var(--blue); }
+
+    .grid2 { display:grid; grid-template-columns: repeat(2, minmax(0,1fr)); gap:10px; }
+    .grid3 { display:grid; grid-template-columns: repeat(3, minmax(0,1fr)); gap:10px; }
+
+    .card { background:var(--panel); border:1px solid var(--line); border-radius:6px; padding:12px; min-width:0; }
+    .card .meta { color:var(--muted); font-size:11px; margin-top:4px; }
+    .card .metric { font-size:18px; color:#fff; font-weight:600; }
+
+    .dup-list { display:grid; gap:6px; margin-top:8px; }
+    .dup-row { display:grid; grid-template-columns: 1fr auto auto; align-items:center; gap:8px; padding:8px 10px; background:#141a1e; border:1px solid #232a30; border-radius:4px; }
+    .dup-row .path { font:12px Consolas, monospace; color:#cdd6dd; overflow:hidden; text-overflow:ellipsis; white-space:nowrap; }
+    .dup-row .size { font-size:11px; color:#8a949d; }
+    .keep-pill { font-size:10px; padding:1px 7px; border-radius:9px; background:#143b22; color:#9be3b3; border:1px solid #245036; }
+    .review-pill { font-size:10px; padding:1px 7px; border-radius:9px; background:#332b16; color:#ffd784; border:1px solid #645228; }
+
+    /* Decision table */
+    table.spec { width:100%; border-collapse:collapse; margin-top:10px; font-size:12px; }
+    table.spec th { text-align:left; padding:8px 10px; background:#181d22; color:#cfdde5; font-weight:600; border-bottom:1px solid #2a3138; }
+    table.spec td { padding:9px 10px; border-bottom:1px solid #1c2126; color:var(--text); vertical-align:top; }
+    table.spec tr:nth-child(even) td { background:#10141a; }
+    table.spec td.order { font-family:Consolas,monospace; color:var(--blue); font-weight:600; }
+    table.spec td.surface { color:#dce5ed; }
+    table.spec td .pill { font-size:10px; }
+    table.spec td .small { color:var(--muted); font-size:11px; display:block; margin-top:2px; }
+
+    /* Popup launcher mock */
+    .popup-mock { background:#0e1114; border:1px dashed #394149; border-radius:6px; padding:18px; display:grid; place-items:center; }
+    .popup-frame { width:340px; border:1px solid var(--line-2); border-radius:6px; background:#181b1e; padding:12px; box-shadow:0 6px 18px rgba(0,0,0,.4); }
+    .popup-frame .ptop { display:flex; justify-content:space-between; align-items:center; margin-bottom:8px; }
+    .popup-frame input { width:100%; background:#0a0c0e; border:1px solid #313840; border-radius:3px; padding:6px 8px; color:var(--text); font:12px Consolas,monospace; }
+    .popup-frame .pchips { display:flex; gap:5px; flex-wrap:wrap; margin-top:8px; }
+    .annot { color:var(--muted); font-size:11px; margin-top:10px; font-style:italic; }
+
+    /* Checklist */
+    .checklist { background:#13171b; border:1px solid #232a30; border-radius:6px; padding:14px; margin-top:10px; }
+    .checklist h3 { color:#dce5ed; text-transform:none; letter-spacing:0; font-size:13px; margin-bottom:8px; }
+    .checkrow { display:grid; grid-template-columns: 22px 1fr auto; gap:8px; padding:7px 0; border-top:1px solid #1c2126; align-items:start; }
+    .checkrow:first-of-type { border-top:0; }
+    .checkrow .box { width:14px; height:14px; border:1px solid #4a5560; border-radius:3px; margin-top:3px; background:#0a0c0e; }
+    .checkrow .what { color:var(--text); font-size:12px; }
+    .checkrow .what .small { color:var(--muted); font-size:11px; }
+    .checkrow .who { color:#9aa4ac; font-size:11px; font-style:italic; }
+
+    /* Decisions / sub-cards */
+    .dec { background:#13171b; border:1px solid #232a30; border-radius:7px; padding:14px; }
+    .dec-head { display:flex; align-items:center; justify-content:space-between; gap:8px; margin-bottom:8px; }
+    .dec-head h3 { color:#dce5ed; text-transform:none; font-size:13px; letter-spacing:0; margin:0; }
+    .dec-verdict { color:#a8b3bb; font-size:12px; margin-top:8px; }
+    .dec-verdict b { color:#ddebf3; }
+    .decisions-2 { display:grid; grid-template-columns: 1fr 1fr; gap:12px; margin-top:10px; }
+
+    /* Sequence */
+    .seq-list { display:grid; gap:6px; margin-top:10px; }
+    .seq-list .step { display:grid; grid-template-columns: 30px 1fr auto auto; gap:10px; padding:9px 12px; background:#13171b; border:1px solid #232a30; border-radius:5px; align-items:center; }
+    .seq-list .num { width:24px; height:24px; border-radius:50%; background:#18354a; color:var(--blue); display:grid; place-items:center; font-weight:700; font-size:11px; }
+    .seq-list .why { color:var(--muted); font-size:11px; }
+    .seq-list .risk { font-size:10px; padding:2px 7px; border-radius:8px; }
+    .seq-list .risk.low { color:#9be3b3; background:#0f2218; border:1px solid #1e3b27; }
+    .seq-list .risk.med { color:#ffd784; background:#231d10; border:1px solid #3d3018; }
+    .seq-list .risk.high { color:#ffb2b7; background:#2a1216; border:1px solid #4a1f25; }
+    .seq-list .deps { font-size:10px; color:#7a838c; font-family:Consolas,monospace; }
+
+    code { font-family:Consolas, monospace; background:#1a1f24; padding:1px 5px; border-radius:3px; color:#cfdde5; }
+    .strike { text-decoration:line-through; color:#6b757d; }
+
+    @media (max-width: 900px) {
+      .layout { grid-template-columns: 1fr; }
+      .side { border-right:0; border-bottom:1px solid var(--line); }
+      .grid2, .grid3, .decisions-2, .status-grid { grid-template-columns: 1fr; }
+    }
+  </style>
+</head>
+<body>
+<main>
+  <h1>rclone-jav Consolidation — Final Converged Plan</h1>
+  <div class="meta-banner">
+    <span class="dot"></span>
+    <span><b>Status:</b> execution in progress. <b>Shipped:</b> steps 1 (Sim Dupe delete), 2 (CSS extraction), 3 (Transfer Assistant delete + Diagnostics replacement), 5 (Recent Activity + Search Troubleshooting → new Debug Tools pane). <b>Pending:</b> steps 6 (options.js split — Cache & Dup Review paired, biggest), 7a (Bulk Check standalone window), 8 (fixtures), 9 (cache contract), 10 (rc-jav.py split), 11 (host fast-path decision). See <code>D:\DEV\Extensions\Production\rclone-jav\AGENTS.md</code> "Console consolidation refactor — execution status" for current state.</span>
+  </div>
+
+  <div class="status-grid">
+    <div class="status-card done">
+      <h3>✓ Decided</h3>
+      <ul>
+        <li>Console / Settings / Support tri-split</li>
+        <li>Default landing = <b>Duplicate Review</b></li>
+        <li>Status badges on tabs, <b>no dashboard pane</b></li>
+        <li>Launcher pattern over toolbox</li>
+        <li>Keep Ranking nested in Dup Review</li>
+        <li>Sim Dupe → <b>delete</b>, samples/ HTML harness</li>
+        <li>Transfer wizard → <b>delete</b> after Diagnostics replacement verified</li>
+        <li>Bulk ID Check → <b>detached chrome.windows popup</b>, NOT a Console sidebar tab</li>
+        <li>Inline rule tests stay, standalone benches → Debug</li>
+      </ul>
+    </div>
+    <div class="status-card done">
+      <h3>✓ Shipped</h3>
+      <ul>
+        <li><b>Step 1:</b> Sim Dupe deleted from popup. <code>samples/sim-dupe.js</code> preserves payload.</li>
+        <li><b>Step 2:</b> CSS extracted → <code>options.css</code>. options.html 1179 → 794 lines.</li>
+        <li><b>Step 3:</b> Transfer wizard deleted. Diagnostics → Native host registration now shows Extension ID + Copy button.</li>
+        <li><b>Step 5:</b> Recent Activity + Search Troubleshooting moved to new Debug Tools pane. Scope verified by code read.</li>
+      </ul>
+    </div>
+    <div class="status-card work">
+      <h3>📋 Pending</h3>
+      <ul>
+        <li><b>Step 6:</b> options.js split (Cache + Dup Review paired). 3133-line file. Biggest, riskiest.</li>
+        <li><b>Step 7a:</b> bulk-check.html standalone + popup launcher.</li>
+        <li><b>Steps 8–10:</b> fixtures, cache contract, rc-jav.py split.</li>
+        <li><b>Step 11:</b> host fast-path benchmark + narrow/delete decision.</li>
+      </ul>
+    </div>
+  </div>
+
+  <!-- ====================================================== -->
+  <h2>1. Primary recommended layout</h2>
+  <p class="intro">Default landing = Duplicate Review (user's most-frequent maintenance workflow). Sidebar tab labels carry live status badges — no dashboard pane needed. Launcher pattern: heavy tools open focused panes, not nested fieldsets.</p>
+
+  <div class="mock">
+    <div class="top">
+      <span class="brand">rclone-jav</span>
+      <div class="toolbar">
+        <button>Profile: cq:JAV</button>
+        <button class="ghost">⚙</button>
+      </div>
+    </div>
+    <div class="layout">
+      <aside class="side">
+        <div class="grp">
+          <div class="gtitle">Console</div>
+          <div class="nav">
+            <a href="#" class="active">Duplicate Review<span class="badge warn">27</span></a>
+            <a href="#">Cache &amp; Scans<span class="badge fresh">28m</span></a>
+            <a href="#">Library Issues<span class="badge">4</span></a>
+          </div>
+          <p style="color:#5e6970; font-size:10px; margin:6px 0 0 6px; font-style:italic;">Bulk Check lives in its own window — popup launcher, not sidebar.</p>
+        </div>
+        <div class="grp">
+          <div class="gtitle">Settings</div>
+          <div class="nav">
+            <a href="#">Profiles</a>
+            <a href="#">Scan Behavior</a>
+            <a href="#">Matching Rules</a>
+            <a href="#">Site Extraction</a>
+            <a href="#">Overlays</a>
+            <a href="#">Deletion</a>
+          </div>
+        </div>
+        <div class="grp">
+          <div class="gtitle">Support</div>
+          <div class="nav">
+            <a href="#">Diagnostics</a>
+            <a href="#">Debug Tools</a>
+          </div>
+        </div>
+      </aside>
+      <div class="content">
+        <div class="heading">
+          <div>
+            <h2 style="margin-top:0;">Duplicate Review <span class="pill warn" style="margin-left:6px;">27 pending</span></h2>
+            <p class="desc">After-upload workflow. Risky groups skipped by default. Keep Ranking lives here as configuration, not in a separate Settings tab.</p>
+          </div>
+          <div class="row-actions">
+            <button>Re-scan</button>
+            <button class="primary">Run Delete Queue (12)</button>
+          </div>
+        </div>
+
+        <div class="sub-tabs">
+          <span class="active">Pending Review</span>
+          <span>Skipped — Risky</span>
+          <span>Keep Ranking Rules</span>
+          <span>Delete History</span>
+        </div>
+
+        <div class="grid2">
+          <div class="card">
+            <h3>Filter (this tool only)</h3>
+            <div class="row-actions" style="margin-top:6px; flex-wrap:wrap;">
+              <button class="ghost">Multipart only</button>
+              <button class="ghost">VIP collision</button>
+              <button class="ghost">Size diff &gt; 100MB</button>
+            </div>
+            <p class="meta">Filters scoped — never exported as global settings.</p>
+          </div>
+          <div class="card">
+            <h3>Delete queue</h3>
+            <div class="metric">12 files · 47.3 GiB</div>
+            <p class="meta">Safety: VIP folders + multipart-risk paths auto-excluded.</p>
+          </div>
+        </div>
+
+        <div style="margin-top:12px;">
+          <h3>JBD-291 · 2 candidates</h3>
+          <div class="dup-list">
+            <div class="dup-row">
+              <span class="path">/JAV/clearjav/JBD-291 [1080p].mp4</span>
+              <span class="size">4.94 GiB</span>
+              <span class="keep-pill">KEEP</span>
+            </div>
+            <div class="dup-row">
+              <span class="path">/JAV/old/JBD-291.mp4</span>
+              <span class="size">3.82 GiB</span>
+              <button class="danger" style="padding:2px 8px; font-size:11px;">Queue delete</button>
+            </div>
+          </div>
+        </div>
+
+        <div style="margin-top:14px;">
+          <h3>OFJE-195 · multipart risk</h3>
+          <div class="dup-list">
+            <div class="dup-row">
+              <span class="path">/JAV/OFJE-195_PART1.mp4</span>
+              <span class="size">2.10 GiB</span>
+              <span class="review-pill">REVIEW</span>
+            </div>
+            <div class="dup-row">
+              <span class="path">/JAV/OFJE-195_PART2.mp4</span>
+              <span class="size">2.08 GiB</span>
+              <span class="review-pill">REVIEW</span>
+            </div>
+          </div>
+        </div>
+      </div>
+    </div>
+  </div>
+
+  <!-- ====================================================== -->
+  <h2>2. Decision table (refactor spec data)</h2>
+  <p class="intro">Each current pane mapped to its future home, treatment, ship order, and replacement work (if any). Ship order = execution sequence within phase 3 (UI consolidation). Steps share PR scope where useful.</p>
+
+  <div class="legend">
+    <span class="pill keep">KEEP visible</span>
+    <span class="pill ctx">CONTEXTUAL (lives with feature)</span>
+    <span class="pill move">MOVE (relocate)</span>
+    <span class="pill debug">DEBUG only</span>
+    <span class="pill del">DELETE</span>
+  </div>
+
+  <table class="spec">
+    <thead>
+      <tr>
+        <th style="width:42px;">#</th>
+        <th>Current surface</th>
+        <th>Future home</th>
+        <th>Treatment</th>
+        <th>Replacement</th>
+      </tr>
+    </thead>
+    <tbody>
+      <tr>
+        <td class="order">1</td>
+        <td class="surface">Sim Dupe popup action</td>
+        <td><code>samples/popup-states.html</code> (repo file)</td>
+        <td><span class="pill del">DELETE</span></td>
+        <td><span class="small">No product replacement. Repo HTML for layout testing only.</span></td>
+      </tr>
+      <tr>
+        <td class="order">2</td>
+        <td class="surface">CSS embedded in options.html</td>
+        <td>Per-pane <code>.css</code> files alongside per-pane JS</td>
+        <td><span class="pill move">EXTRACT</span></td>
+        <td><span class="small">No behavior change. Reduces options.html before JS split.</span></td>
+      </tr>
+      <tr>
+        <td class="order">3</td>
+        <td class="surface">Transfer Assistant wizard</td>
+        <td>(gone)</td>
+        <td><span class="pill del">DELETE</span></td>
+        <td><span class="small">Replacement = Diagnostics 3 actions (see §3 checklist). Delete <em>after</em> verification.</span></td>
+      </tr>
+      <tr>
+        <td class="order">4</td>
+        <td class="surface">Cache &amp; Scans pane</td>
+        <td>Console → Cache &amp; Scans</td>
+        <td><span class="pill keep">KEEP</span></td>
+        <td><span class="small">Paired with Dup Review extraction. State interface shared.</span></td>
+      </tr>
+      <tr>
+        <td class="order">4</td>
+        <td class="surface">Duplicate Review pane</td>
+        <td>Console → Duplicate Review <em>(default landing)</em></td>
+        <td><span class="pill keep">KEEP</span></td>
+        <td><span class="small">Same PR as Cache &amp; Scans. Reads cache state.</span></td>
+      </tr>
+      <tr>
+        <td class="order">4</td>
+        <td class="surface">Keep Ranking Rules pane</td>
+        <td>Duplicate Review → Keep Ranking Rules <em>(sub-tab)</em></td>
+        <td><span class="pill ctx">CONTEXTUAL</span></td>
+        <td><span class="small">Moves with Dup Review. Becomes nested sub-tab.</span></td>
+      </tr>
+      <tr>
+        <td class="order">4</td>
+        <td class="surface">VIP folders config</td>
+        <td>Duplicate Review → Keep Ranking Rules</td>
+        <td><span class="pill ctx">CONTEXTUAL</span></td>
+        <td><span class="small">Feature-specific config moves with feature.</span></td>
+      </tr>
+      <tr>
+        <td class="order">5</td>
+        <td class="surface">Recent Activity (search/page history)</td>
+        <td>Support → Debug Tools → Search Activity</td>
+        <td><span class="pill debug">DEBUG</span></td>
+        <td><span class="small">If audit deletion events also present, split out (pending verification).</span></td>
+      </tr>
+      <tr>
+        <td class="order">5</td>
+        <td class="surface">Search Troubleshooting</td>
+        <td>Support → Debug Tools</td>
+        <td><span class="pill debug">DEBUG</span></td>
+        <td><span class="small">Standalone bench. No edit locality.</span></td>
+      </tr>
+      <tr>
+        <td class="order">5</td>
+        <td class="surface">Page Extraction Test (standalone)</td>
+        <td>Support → Debug Tools</td>
+        <td><span class="pill debug">DEBUG</span></td>
+        <td><span class="small">Inline "Pick Element" variant stays in Site Extraction settings.</span></td>
+      </tr>
+      <tr>
+        <td class="order">5</td>
+        <td class="surface">Test ID Extraction (inline)</td>
+        <td>Settings → Matching Rules (collapsible per editor)</td>
+        <td><span class="pill ctx">CONTEXTUAL</span></td>
+        <td><span class="small">Editor feedback. Stays beside rule it tests.</span></td>
+      </tr>
+      <tr>
+        <td class="order">5</td>
+        <td class="surface">Test ID Extraction (standalone bench)</td>
+        <td>Support → Debug Tools</td>
+        <td><span class="pill debug">DEBUG</span></td>
+        <td><span class="small">Second row — split from inline version above.</span></td>
+      </tr>
+      <tr>
+        <td class="order">6</td>
+        <td class="surface">Library Issues pane</td>
+        <td>Console → Library Issues</td>
+        <td><span class="pill keep">KEEP</span></td>
+        <td><span class="small">Own tab + status badge. Rename UI nested as sub-tab.</span></td>
+      </tr>
+      <tr>
+        <td class="order">6</td>
+        <td class="surface">Bulk ID Check</td>
+        <td><code>bulk-check.html</code> — detached <code>chrome.windows</code> popup</td>
+        <td><span class="pill move">RESHAPE</span></td>
+        <td><span class="small">Removed from Console sidebar. Single entry path = popup launcher button → opens 640×540 detached window. Different tool type than Console panes (transient utility, no sidebar context).</span></td>
+      </tr>
+      <tr>
+        <td class="order">7</td>
+        <td class="surface">Profiles, Scan Behavior, Overlays, Deletion settings</td>
+        <td>Settings → (separate sub-tabs)</td>
+        <td><span class="pill keep">KEEP</span></td>
+        <td><span class="small">Settings sub-tabs split into separate JS files.</span></td>
+      </tr>
+      <tr>
+        <td class="order">7</td>
+        <td class="surface">Matching Rules / Site Extraction</td>
+        <td>Settings → (separate sub-tabs, inline tests retained)</td>
+        <td><span class="pill keep">KEEP</span></td>
+        <td><span class="small">Collapsible inline tester beside each rule.</span></td>
+      </tr>
+      <tr>
+        <td class="order">8</td>
+        <td class="surface">(new) Shared fixture corpus</td>
+        <td>Top-level <code>fixtures/</code> (neutral location)</td>
+        <td><span class="pill move">NEW</span></td>
+        <td><span class="small">Contract between extension and Python. Both consume.</span></td>
+      </tr>
+      <tr>
+        <td class="order">9</td>
+        <td class="surface">Cache contract design</td>
+        <td>CACHE_VERSION (exists) + ID_RULES_VERSION (new)</td>
+        <td><span class="pill move">NEW</span></td>
+        <td><span class="small">Schema bump = force rebuild. Rules bump = warn-and-mark-stale.</span></td>
+      </tr>
+      <tr>
+        <td class="order">10</td>
+        <td class="surface">rc-jav.py monolith</td>
+        <td><code>rcjav/</code> package (ids, cache, dupes, catalog, …)</td>
+        <td><span class="pill move">SPLIT</span></td>
+        <td><span class="small">After fixtures + tests + cache contract exist.</span></td>
+      </tr>
+      <tr>
+        <td class="order">11</td>
+        <td class="surface">Host fast-path search</td>
+        <td>Narrow / Delete / Keep — based on §4 benchmark</td>
+        <td><span class="pill warn">DECIDE</span></td>
+        <td><span class="small">Benchmark idle + under-scan latency first.</span></td>
+      </tr>
+    </tbody>
+  </table>
+
+  <!-- ====================================================== -->
+  <h2>3. Pre-execution checklists (user handoffs)</h2>
+
+  <div class="decisions-2">
+    <div class="checklist">
+      <h3>Diagnostics replacement verification (gates step 3 — Transfer wizard delete)</h3>
+      <div class="checkrow"><span class="box"></span><span class="what">Current extension ID shown as one-line text with copy-to-clipboard button<div class="small">Replaces wizard's "your extension ID is…" step.</div></span><span class="who">user opens<br>Diagnostics</span></div>
+      <div class="checkrow"><span class="box"></span><span class="what">Button labeled "Re-register host" that triggers register-host.bat path<div class="small">Replaces wizard's "run this script" step.</div></span><span class="who">user opens<br>Diagnostics</span></div>
+      <div class="checkrow"><span class="box"></span><span class="what">Verification result shown inline within 2s of register click<div class="small">Replaces wizard's "now check the result" step.</div></span><span class="who">user opens<br>Diagnostics</span></div>
+      <div class="checkrow"><span class="box"></span><span class="what">All three above visible without expanding collapsed sections (one screen)<div class="small">If buried in expandable cards, write better UI first.</div></span><span class="who">visual<br>inspection</span></div>
+    </div>
+
+    <div class="checklist">
+      <h3>Recent Activity scope test (settles split question)</h3>
+      <div class="checkrow"><span class="box"></span><span class="what">Open Recent Activity. Note current entry types visible.<div class="small">LIVE search, CACHE search, MATCH, NO_MATCH, NO_ID, page-check, etc.</div></span><span class="who">user</span></div>
+      <div class="checkrow"><span class="box"></span><span class="what">Perform a delete in Duplicate Review. Refresh Recent Activity.<div class="small">Single delete operation, any candidate.</div></span><span class="who">user</span></div>
+      <div class="checkrow"><span class="box"></span><span class="what">If delete event appears → audit value exists. Split into Dup Review → Delete History.<div class="small">If no → single role. Move entire log to Debug Tools.</div></span><span class="who">user reports</span></div>
+    </div>
+  </div>
+
+  <p class="annot">Cosmetic remaining: popup launcher button label "Bulk Check" vs icon-only. Either works. Default to label until popup row gets crowded.</p>
+
+  <!-- ====================================================== -->
+  <h2>4. Bulk Check — detached window pattern</h2>
+  <p class="intro">User clarified: Bulk Check is a transient utility, not a persistent Console surface. Doesn't fit sidebar-tab pattern alongside Dup Review / Cache &amp; Scans / Library Issues. Decision: standalone <code>bulk-check.html</code> opened as detached <code>chrome.windows</code> popup, no Console sidebar entry. Single canonical entry path = popup launcher button.</p>
+
+  <div class="grid2" style="margin-top:14px;">
+    <div>
+      <h3 style="text-transform:none; letter-spacing:0; font-size:13px; color:#dce5ed; margin-bottom:8px;">Browser-action popup with launcher</h3>
+      <div class="popup-mock">
+        <div class="popup-frame">
+          <div class="ptop">
+            <b style="color:#fff; font-size:13px;">rclone-jav</b>
+            <button class="ghost" style="padding:2px 8px; font-size:11px;">⚙</button>
+          </div>
+          <input value="BLK-474" />
+          <div class="pchips">
+            <button class="primary" style="padding:3px 10px; font-size:11px;">Search</button>
+            <button class="live" style="padding:3px 10px; font-size:11px;">📋 Bulk Check…</button>
+            <button class="ghost" style="padding:3px 10px; font-size:11px;">⏸</button>
+          </div>
+          <div class="annot" style="margin-top:10px;">Single-search stays primary. Bulk button = one click to detached window.</div>
+        </div>
+      </div>
+    </div>
+
+    <div>
+      <h3 style="text-transform:none; letter-spacing:0; font-size:13px; color:#dce5ed; margin-bottom:8px;">Detached window (640×540) after launch</h3>
+      <div class="popup-mock" style="padding:10px;">
+        <div style="width:480px; max-width:100%; background:#181b1e; border:1px solid var(--line-2); border-radius:6px; box-shadow:0 8px 24px rgba(0,0,0,.5); overflow:hidden;">
+          <div style="display:flex; justify-content:space-between; align-items:center; background:#0f1214; border-bottom:1px solid var(--line); padding:8px 12px;">
+            <b style="color:#fff; font-size:13px;">Bulk ID Check</b>
+            <div style="display:flex; gap:4px;">
+              <button class="ghost" style="padding:2px 7px; font-size:11px;">_</button>
+              <button class="ghost" style="padding:2px 7px; font-size:11px;">□</button>
+              <button class="ghost" style="padding:2px 7px; font-size:11px;">×</button>
+            </div>
+          </div>
+          <div style="padding:12px;">
+            <textarea style="width:100%; height:90px; background:#0a0c0e; border:1px solid #313840; border-radius:3px; padding:7px 9px; color:var(--text); font:12px Consolas,monospace; resize:vertical;">BLK-474
+FC2-PPV-1841460
+KV-118
+PRTD-029
+JBD-291</textarea>
+            <div class="row-actions" style="margin-top:8px;">
+              <button class="primary" style="font-size:12px;">Check 5 IDs</button>
+              <button style="font-size:12px;">Clear</button>
+              <button class="ghost" style="font-size:12px;">Import .txt…</button>
+            </div>
+            <div style="margin-top:12px; padding:8px 10px; background:#0f1518; border:1px solid #1d2a30; border-radius:4px; font-size:11px; color:var(--muted);">
+              5 IDs checked · <span style="color:#9be3b3;">3 match</span> · <span style="color:#ffd784;">2 no match</span>
+            </div>
+            <div class="dup-list" style="margin-top:8px;">
+              <div class="dup-row" style="padding:6px 8px;"><span class="path">BLK-474</span><span class="size">4.94 GiB</span><span class="keep-pill">MATCH</span></div>
+              <div class="dup-row" style="padding:6px 8px;"><span class="path">KV-118</span><span class="size">multi-part</span><span class="keep-pill">MATCH</span></div>
+              <div class="dup-row" style="padding:6px 8px;"><span class="path">PRTD-029</span><span class="size">—</span><span class="review-pill">NO MATCH</span></div>
+            </div>
+          </div>
+        </div>
+      </div>
+      <p class="annot">Detached window. No tab bar, no address bar. Closes cleanly when done. Sits over browser, stays visible across tab switches.</p>
+    </div>
+  </div>
+
+  <div class="card" style="background:#13171b; border:1px solid #232a30; margin-top:14px;">
+    <h3 style="color:#dce5ed; text-transform:none; letter-spacing:0; font-size:13px;">Why detached window, not Console tab</h3>
+    <div class="grid2" style="margin-top:8px;">
+      <div>
+        <p class="meta" style="font-size:11px;"><b style="color:#cfdde5;">Other Console tools (Dup Review, Cache &amp; Scans, Library Issues):</b></p>
+        <ul style="color:var(--muted); font-size:11px; margin:6px 0 0 16px; padding:0;">
+          <li>long workflows, multi-pass</li>
+          <li>need sidebar context (compare to other tools)</li>
+          <li>persistent state (review queue, scan job)</li>
+          <li>fit Options sidebar tab pattern</li>
+        </ul>
+      </div>
+      <div>
+        <p class="meta" style="font-size:11px;"><b style="color:#cfdde5;">Bulk Check:</b></p>
+        <ul style="color:var(--muted); font-size:11px; margin:6px 0 0 16px; padding:0;">
+          <li>short workflow, one-shot</li>
+          <li>no sidebar context needed</li>
+          <li>transient state (last-paste persisted, results ephemeral)</li>
+          <li>fits detached-window pattern</li>
+        </ul>
+      </div>
+    </div>
+    <p class="annot" style="margin-top:10px;">Different tool type. Treating it like Dup Review was a category error. Single user knows the feature exists — discovery via popup button is enough.</p>
+  </div>
+
+  <div class="card" style="background:#13171b; border:1px solid #232a30; margin-top:10px;">
+    <h3 style="color:#dce5ed; text-transform:none; letter-spacing:0; font-size:13px;">Implementation notes</h3>
+    <pre style="font-family:Consolas,monospace; font-size:11px; color:#cfdde5; background:#0a0c0e; padding:10px; border-radius:4px; margin:8px 0 0; overflow-x:auto; white-space:pre-wrap;">// Popup launcher click handler
+chrome.windows.create({
+  url: chrome.runtime.getURL('bulk-check.html'),
+  type: 'popup',
+  width: 640,
+  height: 540
+});</pre>
+    <ul style="color:var(--muted); font-size:12px; margin:8px 0 0 16px; padding:0;">
+      <li><b style="color:#dce5ed;">Window dedup:</b> track open bulk-check window ID in <code>chrome.storage.session</code>. Second launcher click focuses existing window instead of spawning duplicate.</li>
+      <li><b style="color:#dce5ed;">State persistence:</b> last paste saved to <code>chrome.storage.local</code> key <code>bulk_check_last_paste</code>. Reopen restores. Results are ephemeral (re-run on reopen).</li>
+      <li><b style="color:#dce5ed;">Backend reuse:</b> calls native host via same messaging path popup search uses. No new backend code.</li>
+      <li><b style="color:#dce5ed;">No back nav:</b> window can't navigate. User closes when done. Ctrl+W closes the bulk window, not a browser tab.</li>
+    </ul>
+  </div>
+
+  <div class="card" style="background:#13171b; border:1px solid #232a30; margin-top:10px;">
+    <h3 style="color:#dce5ed; text-transform:none; letter-spacing:0; font-size:13px;">Edge cases</h3>
+    <ul style="color:var(--muted); font-size:12px; margin:8px 0 0 16px; padding:0;">
+      <li><b style="color:#dce5ed;">Popup auto-closes after launcher click</b> (Chrome behavior). Window survives. Good — that's the intent.</li>
+      <li><b style="color:#dce5ed;">Window positioning unreliable.</b> Chrome treats <code>left/top</code> as hints, multi-monitor users may get the window on the wrong screen. Acceptable for personal-use tool.</li>
+      <li><b style="color:#dce5ed;">Brave / Edge variance.</b> Detached popups behave slightly differently across Chromium forks. Test on user's actual browser before shipping. Fallback if broken: open <code>bulk-check.html</code> in a normal tab via <code>chrome.tabs.create</code>.</li>
+    </ul>
+  </div>
+
+  <div class="card" style="background:#13171b; border:1px solid #232a30; margin-top:10px;">
+    <h3 style="color:#dce5ed; text-transform:none; letter-spacing:0; font-size:13px;">Does NOT generalize</h3>
+    <p class="meta" style="font-size:12px;">Detached-window pattern fits Bulk Check because it's transient + no-sidebar-context + short. Doesn't apply to:</p>
+    <ul style="color:var(--muted); font-size:12px; margin:8px 0 0 16px; padding:0;">
+      <li>Diagnostics — reference info, lives in sidebar fine</li>
+      <li>Setup repair button — already inline in Diagnostics, small enough</li>
+      <li>Dup Review / Cache &amp; Scans / Library Issues — long workflows, sidebar context useful</li>
+      <li>Settings — set-and-forget, not workflow</li>
+    </ul>
+    <p class="annot" style="margin-top:10px;">One-tool answer, not a pattern across the app.</p>
+  </div>
+
+  <!-- ====================================================== -->
+  <h2>5. Execution sequence (final)</h2>
+  <p class="intro">Codex's revised order (triage first, boundary doc second) with my refinements. Risk and dependencies marked. Steps 1–4 are reversible single-file changes (warmup phase). Steps 5–10 = structural. Step 11 = final architectural call.</p>
+
+  <div class="seq-list">
+    <div class="step"><span class="num">1</span><div><b>Per-pane triage</b> <span class="why">— 30 min with user. Decision table above IS this artifact.</span></div><span class="risk low">zero risk</span><span class="deps">no deps</span></div>
+    <div class="step"><span class="num">2</span><div><b>Boundary ownership doc</b> <span class="why">— extension extracts query ID, Python owns filename semantics, host adapts. 1 hour, no code.</span></div><span class="risk low">zero risk</span><span class="deps">after #1</span></div>
+    <div class="step"><span class="num">3</span><div><b>Host fast-path benchmark</b> <span class="why">— latency under idle Python AND under scanning Python. Result gates step 11.</span></div><span class="risk low">measure only</span><span class="deps">no deps</span></div>
+    <div class="step"><span class="num">4</span><div><b>Delete confirmed surfaces</b> <span class="why">— Sim Dupe popup button (no replacement), Transfer wizard (after Diagnostics verification passes).</span></div><span class="risk low">trivial</span><span class="deps">after §3 checklist</span></div>
+    <div class="step"><span class="num">5</span><div><b>CSS extraction from options.html</b> <span class="why">— per-pane CSS files. No behavior change. Bisect-friendly.</span></div><span class="risk low">low</span><span class="deps">after #4</span></div>
+    <div class="step"><span class="num">6</span><div><b>options.js split: Cache &amp; Dup Review paired</b> <span class="why">— Dup Review reads cache state. Single PR extracts both. Keep Ranking moves with Dup Review.</span></div><span class="risk med">moderate</span><span class="deps">after #5</span></div>
+    <div class="step"><span class="num">7</span><div><b>options.js split: Debug Tools + Library Issues + Settings sub-tabs</b> <span class="why">— remaining Options extractions. Inline test components reused across rule editors. Bulk Check is NOT here — it's a new standalone file (step 7a).</span></div><span class="risk med">moderate</span><span class="deps">after #6</span></div>
+    <div class="step"><span class="num">7a</span><div><b>Create <code>bulk-check.html</code> standalone + popup launcher button</b> <span class="why">— new HTML file, own JS module, no Options dependency. Popup gets one button calling <code>chrome.windows.create</code>. Window dedup + state persistence in <code>chrome.storage</code>.</span></div><span class="risk low">additive</span><span class="deps">parallel to #7</span></div>
+    <div class="step"><span class="num">8</span><div><b>Shared fixture corpus</b> <span class="why">— top-level <code>fixtures/</code> (neutral). Python and extension both consume.</span></div><span class="risk low">additive</span><span class="deps">no blocking</span></div>
+    <div class="step"><span class="num">9</span><div><b>Cache contract design</b> <span class="why">— CACHE_VERSION (exists) + ID_RULES_VERSION (new). Schema vs semantics, two concepts.</span></div><span class="risk med">design decision</span><span class="deps">before #10</span></div>
+    <div class="step"><span class="num">10</span><div><b>rc-jav.py module split</b> <span class="why">— ids.py, cache.py, dupes.py, catalog.py, rclone_io.py, cli.py. Tests pre-exist via #8.</span></div><span class="risk med">code churn</span><span class="deps">after #8, #9</span></div>
+    <div class="step"><span class="num">11</span><div><b>Host narrow / keep / delete</b> <span class="why">— based on #3 benchmark. If under-scan responsiveness depends on host = keep narrow. If not = delete.</span></div><span class="risk high">behavior change</span><span class="deps">after #3, #10</span></div>
+  </div>
+
+  <!-- ====================================================== -->
+  <h2>6. Acceptance criteria template</h2>
+  <p class="intro">Each step in the sequence needs three things in the final spec: acceptance criterion, rollback procedure, touched-files list. Without these, "ship order N" is a wish not a plan. Template below — fill per step in spec doc.</p>
+
+  <div class="card" style="background:#13171b; border:1px solid #232a30;">
+    <h3>Template per sequence step</h3>
+    <div style="font-family:Consolas,monospace; font-size:12px; color:#cfdde5; background:#0a0c0e; padding:12px; border-radius:4px; margin-top:8px; white-space:pre-wrap;">step: 6
+title: options.js split — Cache &amp; Dup Review paired
+
+touched_files:
+  - options.html (script tag order changes)
+  - options.js (DELETE: cache section, dup review section, keep ranking section)
+  - options-cache.js (NEW)
+  - options-review.js (NEW)
+  - options-core.js (NEW: shared helpers, pane nav, save/load)
+
+acceptance:
+  - Fresh extension reload, options.html opens
+  - Default landing = Duplicate Review tab
+  - Cache &amp; Scans tab loads, shows last scan timestamp
+  - Run Duplicate Review on existing cache — same result set as pre-refactor
+  - Keep Ranking Rules sub-tab inside Dup Review opens
+  - No console errors on load or interaction
+
+rollback:
+  - git revert &lt;sha&gt;
+  - No data migration. Cache schema unchanged. Storage keys unchanged.
+  - Diagnostics-verified replacement of Transfer wizard remains intact (step 3 already shipped).</div>
+  </div>
+
+  <!-- ====================================================== -->
+  <h2>7. Out of scope (explicitly rejected)</h2>
+  <ul style="color:var(--muted); margin:0 0 30px 18px; font-size:13px;">
+    <li><b style="color:#dce5ed;">Dashboard pane</b> — tab badges replace. Adding a dashboard creates a feature sink.</li>
+    <li><b style="color:#dce5ed;">After-Upload workflow wizard page</b> — sidebar nav order already encodes the workflow.</li>
+    <li><b style="color:#dce5ed;">Matching Lab consolidation page</b> — inline tests cover editor needs, standalone bench in Debug covers diagnostic needs.</li>
+    <li><b style="color:#dce5ed;">Mode switcher top bar (Console / Settings / Support segmented control)</b> — sidebar groups do this.</li>
+    <li><b style="color:#dce5ed;">In-extension Sim Dupe / Debug Preview page</b> — repo HTML file is enough for single-user layout work.</li>
+    <li><b style="color:#dce5ed;">Popup bulk mode toggle</b> — popup stays single-job. Launcher button opens detached window, no inline bulk mode.</li>
+    <li><b style="color:#dce5ed;">Bulk ID Check as Console sidebar tab</b> — wrong tool type for sidebar pattern. Detached window matches its transient nature.</li>
+    <li><b style="color:#dce5ed;">Bulk Check as Options-page deep-link tab</b> — previously considered. Rejected: leaves a leftover tab open after use, Options sidebar adds noise to a one-shot tool.</li>
+    <li><b style="color:#dce5ed;">Frontend framework (React/Vue/Svelte)</b> — vanilla + ordered script files is correct for MV3 + project scale.</li>
+    <li><b style="color:#dce5ed;">Console.log telemetry for usage audit</b> — manual triage of single-user project beats instrumented signals.</li>
+  </ul>
+
+  <h2>8. Net position</h2>
+  <p class="intro" style="margin-bottom:30px;">Architecture decided. Three small user handoffs remain (Diagnostics verification, Recent Activity scope check, popup button label). After those, decision table expands into per-step spec with acceptance + rollback. Code work begins on step 1 (smallest, fastest, lowest risk). Total estimated execution span: phased over multiple PRs, no big-bang refactor.</p>
+
+</main>
+</body>
+</html>
diff --git a/mockups/console-consolidation-options.html b/mockups/console-consolidation-options.html
new file mode 100644
index 0000000..abe511e
--- /dev/null
+++ b/mockups/console-consolidation-options.html
@@ -0,0 +1,355 @@
+<!doctype html>
+<html>
+<head>
+  <meta charset="utf-8">
+  <title>rclone-jav console consolidation direction</title>
+  <style>
+    :root {
+      color-scheme: dark;
+      --bg: #0e1011;
+      --shell: #17191b;
+      --panel: #121416;
+      --surface: #1d2023;
+      --line: #2b3035;
+      --line-2: #3b434b;
+      --text: #dce2e7;
+      --muted: #87939d;
+      --blue: #71c5ff;
+      --green: #7de7a1;
+      --yellow: #ffd36e;
+      --red: #ff8e94;
+      --purple: #c5a9ff;
+    }
+    * { box-sizing: border-box; }
+    body {
+      margin: 0;
+      background: var(--bg);
+      color: var(--text);
+      font: 13px/1.45 -apple-system, BlinkMacSystemFont, "Segoe UI", sans-serif;
+      letter-spacing: 0;
+    }
+    main { padding: 24px; max-width: 1660px; margin: 0 auto; }
+    h1 { margin: 0; font-size: 23px; }
+    h2 { margin: 0 0 10px; font-size: 15px; color: #f4f7fa; }
+    h3 { margin: 0 0 5px; font-size: 12px; text-transform: uppercase; color: #9da9b2; letter-spacing: 0; }
+    p { margin: 0; }
+    .intro { color: var(--muted); max-width: 950px; margin: 5px 0 18px; }
+    .legend { display:flex; gap:7px; flex-wrap:wrap; margin-bottom:18px; }
+    .pill, .badge, button {
+      border: 1px solid var(--line-2);
+      border-radius: 4px;
+      padding: 4px 9px;
+      background: #252a2e;
+      color: var(--text);
+      font: inherit;
+    }
+    .pill { border-radius: 12px; font-size: 11px; }
+    .pill.console { color:var(--green); background:#153020; border-color:#245337; }
+    .pill.settings { color:var(--blue); background:#142838; border-color:#284b66; }
+    .pill.support { color:var(--purple); background:#241d35; border-color:#453363; }
+    .pill.choice { color:var(--yellow); background:#332b16; border-color:#645228; }
+    .grid { display:grid; grid-template-columns: 1fr; gap:18px; align-items:start; }
+    .option {
+      border: 1px solid var(--line);
+      background: #141719;
+      border-radius: 8px;
+      padding: 13px;
+      min-width: 0;
+    }
+    .option-head { display:flex; justify-content:space-between; gap:10px; margin-bottom:10px; align-items:flex-start; }
+    .option-note { color:var(--muted); font-size:12px; }
+    .mock {
+      border:1px solid #333a41;
+      border-radius:8px;
+      background: var(--shell);
+      overflow:hidden;
+      min-height: 420px;
+      width: 100%;
+    }
+    .top {
+      display:flex; align-items:center; justify-content:space-between; gap:12px;
+      padding:11px 13px; border-bottom:1px solid var(--line); background:#111315;
+    }
+    .brand { font-weight:700; color:#fff; font-size:14px; }
+    .tabs, .toolbar, .chips { display:flex; gap:6px; flex-wrap:wrap; align-items:center; }
+    button { padding:5px 10px; border-radius:4px; cursor:default; }
+    button.primary { background:#173923; color:#aaf3bf; border-color:#285b3a; }
+    button.live { background:#143247; color:#98d6ff; border-color:#2e607f; }
+    button.warn { background:#3a3217; color:#ffe28b; border-color:#66552a; }
+    button.danger { background:#3a191d; color:#ffb2b7; border-color:#722c33; }
+    .layout { display:grid; grid-template-columns: 150px minmax(0,1fr); min-height:368px; }
+    .side { background:#101214; border-right:1px solid var(--line); padding:11px; }
+    .g { margin-bottom:13px; }
+    .gtitle { color:#68747d; text-transform:uppercase; letter-spacing:0; font-size:10px; margin:0 0 5px; }
+    .nav { display:grid; gap:3px; }
+    .nav span { display:block; padding:6px 7px; border-radius:4px; color:#aeb8bf; }
+    .nav span.active { background:#27313a; color:#fff; box-shadow:inset 2px 0 var(--blue); }
+    .content { padding:12px; min-width:0; }
+    .heading { display:flex; justify-content:space-between; gap:10px; align-items:start; margin-bottom:10px; }
+    .desc { color:var(--muted); font-size:11px; }
+    .cards { display:grid; gap:9px; }
+    .two { display:grid; grid-template-columns: repeat(2, minmax(0,1fr)); gap:9px; }
+    .three { display:grid; grid-template-columns: repeat(3, minmax(0,1fr)); gap:8px; }
+    .card, .panel, .modal, .popup, .step {
+      border:1px solid var(--line);
+      background:var(--panel);
+      border-radius:6px;
+      padding:10px;
+      min-width:0;
+    }
+    .card strong { color:#fff; }
+    .meta { color:var(--muted); font-size:11px; }
+    .mono { font-family:Consolas, monospace; font-size:11px; }
+    .metric { font-size:18px; color:#fff; font-weight:700; }
+    .line { border-top:1px solid #23282c; margin:8px 0; }
+    .status { border-radius:5px; padding:7px 8px; border:1px solid #294b34; background:#14301e; color:#b6f5c7; }
+    .status.warn { border-color:#5d5225; background:#332d16; color:#ffe188; }
+    .list { display:grid; gap:5px; margin-top:7px; }
+    .row { display:flex; justify-content:space-between; gap:8px; align-items:center; border-top:1px solid #23282c; padding-top:5px; min-width:0; }
+    .row:first-child { border-top:0; padding-top:0; }
+    .path { overflow:hidden; text-overflow:ellipsis; white-space:nowrap; color:#b9c6ce; }
+    .bar { height:5px; background:#272c31; border-radius:99px; overflow:hidden; margin-top:7px; }
+    .fill { height:100%; width:72%; background:linear-gradient(90deg,var(--blue),var(--green)); }
+    .launchers { display:grid; grid-template-columns: repeat(2,minmax(0,1fr)); gap:8px; }
+    .launcher { border:1px dashed #44515b; border-radius:6px; padding:11px; background:#12191f; }
+    .launcher b { display:block; color:#fff; margin-bottom:4px; }
+    .modal-stage { position:relative; min-height:250px; background:#0d1012; border:1px dashed #394149; border-radius:7px; padding:14px; }
+    .modal { width:min(100%, 385px); margin:22px auto 0; box-shadow:0 18px 46px rgba(0,0,0,.45); }
+    .workflow { display:grid; gap:8px; }
+    .step { display:grid; grid-template-columns:28px minmax(0,1fr) auto; align-items:center; gap:8px; }
+    .num { width:24px; height:24px; border-radius:50%; display:grid; place-items:center; background:#18354a; color:var(--blue); font-weight:700; }
+    .popup-stage { display:grid; place-items:center; min-height:340px; background:#0d1012; border:1px dashed #394149; border-radius:7px; padding:14px; }
+    .popup { width:360px; box-shadow:0 14px 42px rgba(0,0,0,.45); }
+    input, textarea {
+      width:100%; background:#0c0e10; color:var(--text); border:1px solid #323940; border-radius:4px;
+      padding:7px 8px; font:12px Consolas, monospace;
+    }
+    textarea { min-height:74px; resize:none; }
+    .seg { display:flex; border:1px solid var(--line-2); border-radius:4px; overflow:hidden; }
+    .seg span { min-width:58px; text-align:center; padding:4px 7px; color:#8b97a0; background:#22272b; border-right:1px solid var(--line-2); font-size:11px; }
+    .seg span:last-child { border-right:0; }
+    .seg span.active { color:var(--blue); background:#173043; }
+    .debug-grid { display:grid; grid-template-columns: 180px minmax(0,1fr); gap:9px; }
+    .preview { border:1px solid #2d3640; background:#101820; border-radius:6px; padding:9px; }
+    .preview-hit { border:1px solid #2d5339; background:#14241a; border-radius:5px; padding:7px; margin-top:7px; }
+    .bench-switch { display:flex; gap:5px; flex-wrap:wrap; margin-bottom:8px; }
+    .bench-switch span { border:1px solid var(--line-2); border-radius:12px; padding:3px 8px; font-size:11px; color:#adb7bf; }
+    .bench-switch span.active { color:var(--yellow); background:#332b16; border-color:#645228; }
+    .verdict { margin-top:9px; color:#aeb8bf; font-size:12px; }
+    @media (max-width: 760px) {
+      main { padding:14px; }
+      .layout, .debug-grid { grid-template-columns:1fr; }
+      .side { border-right:0; border-bottom:1px solid var(--line); }
+      .two, .three, .launchers { grid-template-columns:1fr; }
+      .popup { width:100%; }
+    }
+  </style>
+</head>
+<body>
+<main>
+  <h1>rclone-jav Consolidation Direction</h1>
+  <p class="intro">Updated after the refactor discussion. The page keeps the earlier visual samples, but the decisions are now explicit: launcher-style maintenance console, Duplicate Review as the default work surface, status on navigation instead of a dashboard pane, Bulk ID Check with a popup-launched quick window plus a full Console tool, and debug/testing surfaces pulled out of the daily workflow.</p>
+  <div class="legend">
+    <span class="pill console">Frequent maintenance</span>
+    <span class="pill settings">Set-and-forget settings</span>
+    <span class="pill support">Support / debug</span>
+    <span class="pill choice">Placement decision</span>
+  </div>
+
+  <div class="grid">
+    <section class="option">
+      <div class="option-head"><div><h2>1. Recommended Console Shell</h2><p class="option-note">Frequent maintenance tools get focused destinations. The navigation carries status instead of a separate dashboard pane.</p></div><span class="pill console">chosen direction</span></div>
+      <div class="mock">
+        <div class="top"><span class="brand">rclone-jav Console</span><div class="toolbar"><button>Profile: cq:JAV</button><button>Options</button></div></div>
+        <div class="layout">
+          <aside class="side">
+            <div class="g"><div class="gtitle">Console</div><div class="nav"><span class="active">Duplicate Review [27]</span><span>Cache & Scans [28m]</span><span>Library Issues [4]</span><span>Bulk ID Check</span></div></div>
+            <div class="g"><div class="gtitle">Settings</div><div class="nav"><span>Profiles</span><span>Scan Behavior</span><span>Matching Rules</span><span>Deletion</span></div></div>
+            <div class="g"><div class="gtitle">Support</div><div class="nav"><span>Diagnostics</span><span>Debug Tools</span></div></div>
+          </aside>
+          <div class="content">
+            <div class="heading"><div><h2>Duplicate Review</h2><p class="desc">Default landing after uploads. Keep Ranking Rules and delete history stay with the workflow that uses them.</p></div><span class="pill choice">27 pending</span></div>
+            <div class="two">
+              <div class="card"><h3>Review Queue</h3><div class="metric">12 ready · 2 risky</div><p class="meta">Uses VIP folders, multipart safety, keep reasons, and delete queue checks.</p><div class="chips"><button class="primary">Review Duplicates</button><button>Skipped Risks</button></div></div>
+              <div class="card"><h3>Contextual Config</h3><p>Keep Ranking Rules live inside Duplicate Review, not as a distant general setting.</p><div class="chips"><button>Keep Ranking Rules</button><button>Delete History</button></div></div>
+            </div>
+            <div class="two" style="margin-top:9px;">
+              <div class="card"><h3>Cache Status Lives In Nav</h3><p>Cache & Scans owns the scan detail. The sidebar badge is enough while you review dupes.</p><button>Open Cache & Scans</button></div>
+              <div class="card"><h3>Console Neighbors</h3><p>Library Issues and Bulk ID Check remain direct tools, not settings fieldsets.</p><div class="chips"><button>Library Issues</button><button>Bulk ID Check</button></div></div>
+            </div>
+          </div>
+        </div>
+      </div>
+      <p class="verdict">Chosen: Console / Settings / Support sidebar, Duplicate Review first, no dashboard pane.</p>
+    </section>
+
+    <section class="option">
+      <div class="option-head"><div><h2>2. Launcher Treatment</h2><p class="option-note">The page should open focused maintenance views instead of collecting every heavy tool as a permanent fieldset.</p></div><span class="pill console">chosen pattern</span></div>
+      <div class="mock">
+        <div class="top"><span class="brand">Library Console</span><div class="tabs"><button class="live">Console</button><button>Settings</button><button>Support</button></div></div>
+        <div class="content">
+          <div class="two">
+            <div class="card"><h3>Cache Status</h3><div class="status">Fresh cache · cq:JAV · last scan 28m ago</div><div class="chips" style="margin-top:8px;"><button class="primary">Update Cache</button><button>Open Cache Console</button></div></div>
+            <div class="card"><h3>Next Maintenance</h3><p class="meta">Large tools stay out of the page until you open them.</p><div class="chips" style="margin-top:8px;"><button class="primary">Review Duplicates</button><button>Bulk Check</button><button>Library Issues</button></div></div>
+          </div>
+          <div class="modal-stage" style="margin-top:10px;">
+            <div class="meta">Example focused tool opened from a launcher</div>
+            <div class="modal">
+              <div class="heading"><div><h2>Duplicate Review</h2><p class="desc">Full space for filters, keep reasons, and delete queue safety.</p></div><button>x</button></div>
+              <div class="status warn">2 risky groups skipped by default</div>
+              <div class="list">
+                <div class="row"><span class="path">JBD-291 ClearJAV vs older MP4</span><span class="badge">KEEP</span></div>
+                <div class="row"><span class="path">OFJE-195 multipart warning</span><span class="badge">REVIEW</span></div>
+              </div>
+            </div>
+          </div>
+        </div>
+      </div>
+      <p class="verdict">Chosen for the big surfaces: Duplicate Review, Cache & Scans, Library Issues, and Bulk ID Check.</p>
+    </section>
+
+    <section class="option">
+      <div class="option-head"><div><h2>3. Boundary Without A Mode Switcher</h2><p class="option-note">Console, Settings, and Support stay distinct through sidebar groups, not a second top-level mode control.</p></div><span class="pill settings">chosen boundary</span></div>
+      <div class="mock">
+        <div class="top"><span class="brand">rclone-jav</span><div class="toolbar"><button class="live">Console</button><button>Settings</button><button>Support</button></div></div>
+        <div class="layout">
+          <aside class="side">
+            <div class="g"><div class="gtitle">Console</div><div class="nav"><span class="active">After Upload</span><span>Cache & Scans</span><span>Duplicate Review</span><span>Bulk ID Check</span></div></div>
+          </aside>
+          <div class="content">
+            <div class="three">
+              <div class="card"><span class="pill console">Console</span><h2 style="margin-top:7px;">Maintenance</h2><p class="meta">Review the library repeatedly.</p></div>
+              <div class="card"><span class="pill settings">Settings</span><h2 style="margin-top:7px;">Configure</h2><p class="meta">Profiles, rules, overlays, deletion.</p></div>
+              <div class="card"><span class="pill support">Support</span><h2 style="margin-top:7px;">Troubleshoot</h2><p class="meta">Diagnostics, debug benches, setup.</p></div>
+            </div>
+            <div class="panel" style="margin-top:9px;">
+              <h3>Settings mode would look quieter</h3>
+              <div class="chips"><button>Profiles</button><button>Scan Behavior</button><button>Overlays</button><button>Site Extraction</button><button>ID Rules</button><button>Deletion</button></div>
+            </div>
+          </div>
+        </div>
+      </div>
+      <p class="verdict">Chosen conceptually, simplified visually: sidebar groups do the separating work.</p>
+    </section>
+
+    <section class="option">
+      <div class="option-head"><div><h2>4. No Workflow Wizard</h2><p class="option-note">The maintenance order is real, but it should be encoded by the Console tools themselves rather than another page.</p></div><span class="pill choice">rejected surface</span></div>
+      <div class="mock">
+        <div class="top"><span class="brand">Console Order</span><div class="toolbar"><button>Profile: cq:JAV</button><button>Settings</button></div></div>
+        <div class="content">
+          <div class="heading"><div><h2>Maintenance stays obvious</h2><p class="desc">The sidebar and focused tools make the flow clear without adding a separate wizard surface.</p></div></div>
+          <div class="workflow">
+            <div class="step"><span class="num">1</span><div><strong>Refresh cache</strong><div class="meta">Update changed files from configured roots.</div></div><button class="primary">Update 24h</button></div>
+            <div class="step"><span class="num">2</span><div><strong>Review skipped names</strong><div class="meta">Spot files that did not produce an ID.</div></div><button>Review Skipped</button></div>
+            <div class="step"><span class="num">3</span><div><strong>Review duplicates</strong><div class="meta">KEEP reasons and multipart-risk skips included.</div></div><button class="primary">Open Review</button></div>
+            <div class="step"><span class="num">4</span><div><strong>Check library issues</strong><div class="meta">Rename bracket/no-hyphen oddities if needed.</div></div><button>Open Issues</button></div>
+          </div>
+          <div class="panel" style="margin-top:9px;"><div class="chips"><span class="pill choice">Utility</span><button>Bulk ID Check</button><button>Cache Console</button><button>Ranking Rules</button></div></div>
+        </div>
+      </div>
+      <p class="verdict">Rejected as a dedicated home page. Useful order, unnecessary extra destination.</p>
+    </section>
+
+    <section class="option">
+      <div class="option-head"><div><h2>5. Rejected: Bulk Mode Inside Popup</h2><p class="option-note">This would turn the popup into a two-mode mini-app with cramped result review.</p></div><span class="pill choice">rejected</span></div>
+      <div class="popup-stage">
+        <div class="popup">
+          <div class="heading"><span class="brand">rclone-jav</span><div class="toolbar"><div class="seg"><span class="active">LIVE</span><span>CACHE</span></div><button>gear</button></div></div>
+          <div class="seg" style="margin-bottom:8px;"><span>Single</span><span class="active">Bulk</span></div>
+          <textarea>BLK-474&#10;FC2-PPV-1841460&#10;PRTD-[027-030]</textarea>
+          <div class="chips" style="margin:7px 0;"><button class="primary">Check IDs</button><button>Clear</button></div>
+          <div class="status">6 IDs checked · 4 match · 2 no match</div>
+          <div class="list">
+            <div class="row"><span class="path">BLK-474</span><span class="pill console">MATCH</span></div>
+            <div class="row"><span class="path">PRTD-029</span><span class="pill choice">NO MATCH</span></div>
+            <div class="row"><span class="path">FC2-PPV-1841460</span><span class="pill console">MATCH</span></div>
+          </div>
+        </div>
+      </div>
+      <p class="verdict">Rejected even for 5-20 IDs. The popup gets a doorway into a focused Bulk Check surface, not a permanent second mode.</p>
+    </section>
+
+    <section class="option">
+      <div class="option-head"><div><h2>6. Chosen: Bulk Check Quick Window</h2><p class="option-note">Typical batches are expected to be about 5-20 IDs, so the popup opens a compact focused window while the Console owns the full tool.</p></div><span class="pill console">chosen bulk path</span></div>
+      <div class="popup-stage">
+        <div class="three" style="width:100%; align-items:start;">
+          <div class="popup">
+            <div class="heading"><span class="brand">rclone-jav</span><button>gear</button></div>
+            <input value="BLK-474">
+            <div class="status" style="margin-top:8px;">MATCH · 1 hit</div>
+            <div class="chips" style="margin-top:8px;"><button>Re-Scan</button><button class="live">Bulk Check</button></div>
+          </div>
+          <div class="modal">
+            <div class="heading"><div><h2>Bulk Check</h2><p class="desc">Quick batch window</p></div><button>x</button></div>
+            <textarea>BLK-474&#10;FC2-PPV-1841460&#10;PRTD-027</textarea>
+            <div class="chips" style="margin-top:7px;"><button class="primary">Check IDs</button><button>Clear</button></div>
+            <div class="status" style="margin-top:8px;">3 IDs · 2 match · 1 no match</div>
+            <div class="list">
+              <div class="row"><span class="path">BLK-474</span><span class="pill console">MATCH</span></div>
+              <div class="row"><span class="path">PRTD-027</span><span class="pill choice">NO MATCH</span></div>
+            </div>
+            <div class="chips" style="margin-top:8px;"><button>Open Full Console</button></div>
+          </div>
+          <div class="card">
+            <h3>Console Owner</h3>
+            <textarea>Paste larger batches here...</textarea>
+            <div class="chips" style="margin-top:7px;"><button class="primary">Check IDs</button><button>Export Results</button></div>
+            <p class="meta" style="margin-top:7px;">Full-width rows, richer review, ranges, import/export, future filters.</p>
+          </div>
+        </div>
+      </div>
+      <p class="verdict">Chosen: popup opens a compact Bulk Check window for short batches. The Console remains the full batch-review surface.</p>
+    </section>
+
+    <section class="option">
+      <div class="option-head"><div><h2>7. Debug Split + Repo Preview</h2><p class="option-note">Debug history and standalone tests move out of daily workflow. Sim Dupe leaves the extension UI entirely.</p></div><span class="pill support">chosen support split</span></div>
+      <div class="mock">
+        <div class="top"><span class="brand">Support / Debug Tools</span><button>Diagnostics</button></div>
+        <div class="content debug-grid">
+          <div class="card">
+            <h3>Debug Tools</h3>
+            <div class="nav"><span class="active">Search Activity</span><span>Search Troubleshooting</span><span>ID Extraction</span><span>Page Extraction</span><span>Diagnostics</span></div>
+          </div>
+          <div class="preview">
+            <div class="heading"><div><h2>Repo Preview Harness</h2><p class="desc">Popup state samples live in a repo HTML file such as <span class="mono">samples/popup-states.html</span>, not as a hidden extension page.</p></div></div>
+            <div class="chips"><button>Open sample file</button><button class="live">Search Activity</button><button>Diagnostics</button></div>
+            <div class="preview-hit">
+              <div class="status">MATCH · sample popup state</div>
+              <div class="list"><div class="row"><span class="path">BLK-474 - ClearJAV.mp4</span><span>4.94 GiB</span></div><div class="row"><span class="path">BLK-474 [1080p].mp4</span><span>4.90 GiB</span></div></div>
+            </div>
+          </div>
+        </div>
+      </div>
+      <p class="verdict">Chosen: standalone support/debug tools remain available; Sim Dupe is removed from extension UI.</p>
+    </section>
+
+    <section class="option">
+      <div class="option-head"><div><h2>8. Inline Rule Feedback</h2><p class="option-note">Rule editors keep local feedback. Only standalone troubleshooting benches move to Debug Tools.</p></div><span class="pill support">chosen bench split</span></div>
+      <div class="mock">
+        <div class="top"><span class="brand">Settings / Matching Rules</span><span class="pill choice">feedback stays nearby</span></div>
+        <div class="content">
+          <div class="bench-switch"><span class="active">Custom Part Detector</span><span>ID Normalizer</span><span>Site Extraction</span></div>
+          <div class="two">
+            <div class="card">
+              <h3>Rule</h3>
+              <textarea>_PART(\d+)$</textarea>
+              <div class="chips" style="margin-top:7px;"><button class="primary">Test this rule</button><button>Use samples</button></div>
+            </div>
+            <div class="card">
+              <h3>Inline Feedback</h3>
+              <div class="list">
+                <div class="row"><span>KV-118_PART1.mp4</span><span class="pill settings">part 1</span></div>
+                <div class="row"><span>KV-118_PART2.mp4</span><span class="pill settings">part 2</span></div>
+                <div class="row"><span>Covered by built-in?</span><span class="pill console">shown</span></div>
+              </div>
+            </div>
+          </div>
+          <div class="panel" style="margin-top:9px;"><p class="meta">Standalone Search Troubleshooting, page extraction testing, and search history can still move into Support. Editing rules should not require leaving the editor to see feedback.</p></div>
+        </div>
+      </div>
+      <p class="verdict">Chosen: contextual inline tests stay. General troubleshooting tools move to Support.</p>
+    </section>
+  </div>
+</main>
+</body>
+</html>
diff --git a/rc-jav.py b/rc-jav.py
new file mode 100644
index 0000000..37fc844
--- /dev/null
+++ b/rc-jav.py
@@ -0,0 +1,2230 @@
+#!/usr/bin/env python3
+"""Scan rclone remotes for duplicate JAV files grouped by ID."""
+from __future__ import annotations
+
+import argparse
+import csv
+import fnmatch
+import json
+import os
+import re
+import subprocess
+import sys
+import threading
+import time
+import xml.etree.ElementTree as ET
+from dataclasses import dataclass, asdict
+from datetime import datetime
+from pathlib import Path
+from typing import Iterable
+
+from rich.console import Console
+from rich.panel import Panel
+from rich.progress import (
+    BarColumn,
+    MofNCompleteColumn,
+    Progress,
+    SpinnerColumn,
+    TextColumn,
+    TimeElapsedColumn,
+    TimeRemainingColumn,
+)
+from rich.table import Table
+from rich.text import Text
+
+PRIMARY_ID_RE = re.compile(r"^([A-Za-z]+)-(\d+)")
+FALLBACK_ID_RE = re.compile(r"^([A-Za-z0-9]+)-(\d+)")
+COMPOUND_ID_RE = re.compile(r"^([A-Za-z0-9]+(?:-[A-Za-z0-9]+)+)-(\d+)")
+
+# Part-suffix patterns: anchored at end of stem (after stripping extension).
+# Each pattern's group(1) is the part number.
+RANGE_RE = re.compile(r"\[(\d+)-(\d+)\]")
+
+# Non-anchored XofY probe used in detect_part() to resolve the priority conflict
+# between a trailing (N) copy-marker suffix and an embedded XofY part indicator.
+# Example: "ENKI-031 [1080p].2of2 (1)" — the (1) is a filesystem collision suffix
+# (rclone, Windows copy), not a part number; the 2of2 is the real part indicator.
+# This pattern intentionally has no end-anchor so it matches anywhere in the stem.
+_XOFY_PRIORITY_RE = re.compile(r"[._ -](\d+)\s*of\s*\d+", re.IGNORECASE)
+
+BUILTIN_PART_RES = [
+    re.compile(r"[-_ ](?:pt|part|cd|disc)[-_ ]?(\d+)$", re.IGNORECASE),
+    re.compile(r"\s*\((\d+)(?:\s*of\s*\d+)?\)$", re.IGNORECASE),
+    # Exported multipart filenames often end in `.1of2` / `-2 of 4`.
+    re.compile(r"[._ -](\d+)\s*of\s*\d+$", re.IGNORECASE),
+    # Bare numeric suffixes (`_N`, ` N`) are only treated as part numbers when
+    # the number is 1-2 digits. Wider patterns falsely matched resolution tags
+    # (`_2160`, `_4K2160`) and dates/years (`SSIS-001 2023.mp4` -> `#part2023`),
+    # corrupting cache keys.
+    # Staged detection also retries after resolution/actress cleanup, so end
+    # anchors can match both raw suffixes and metadata-blocked suffixes safely.
+    re.compile(r"_(\d{1,2})$"),
+    # Hyphen short-part suffix after the ID, e.g. OFJE-195-1 [480p].mp4.
+    # Limit to 1-2 digits so the base ID's usual 3+ digit numeric component
+    # does not make every canonical `ABC-123` filename look multipart.
+    re.compile(r"-(\d{1,2})$"),
+    # Lettered parts: separator (hyphen or underscore) followed by A-D.
+    # Uppercase only — lowercase letters are variant designators (e.g. IBW-902z)
+    # and are preserved as part of the base ID, not treated as part numbers.
+    re.compile(r"[-_]([A-D])$"),
+    # Bare uppercase letter directly after the ID digits with no separator,
+    # e.g. BAK-052A, BAK-052B.  Lookbehind ensures a digit precedes.
+    re.compile(r"(?<=\d)([A-D])$"),
+    re.compile(r"\s+(\d{1,2})$"),
+]
+PART_RES = list(BUILTIN_PART_RES)
+
+
+def configure_part_patterns(patterns: Iterable[str]) -> list[str]:
+    """Extend part suffix detection with user regexes whose first group is part number."""
+    global PART_RES
+    PART_RES = list(BUILTIN_PART_RES)
+    errors: list[str] = []
+    for pattern in patterns:
+        pattern = str(pattern or "").strip()
+        if not pattern:
+            continue
+        try:
+            compiled = re.compile(pattern, re.IGNORECASE)
+        except re.error as e:
+            errors.append(f"{pattern!r}: {e}")
+            continue
+        if compiled.groups < 1:
+            errors.append(f"{pattern!r}: needs a capture group for the part number")
+            continue
+        PART_RES.append(compiled)
+    return errors
+
+
+def detect_part(stem: str) -> str | None:
+    """Return part number as string if stem ends with a part suffix, else None.
+
+    XofY (e.g. .2of2) anywhere in the stem takes unconditional priority over a
+    trailing (N) suffix.  A file named 'ENKI-031 [1080p].2of2 (1).mp4' is part 2;
+    the trailing (1) is a filesystem copy-collision marker (rclone / Windows),
+    not a part number.  Without this pre-check the ordered PART_RES list would
+    match (1) first and misclassify the file as part 1.
+    """
+    m = _XOFY_PRIORITY_RE.search(stem)
+    if m:
+        return m.group(1)
+    for r in PART_RES:
+        m = r.search(stem)
+        if m:
+            return m.group(1)
+    return None
+
+
+def part_key(part: str) -> str:
+    token = str(part or "").strip()
+    if token.isdigit():
+        return str(int(token))
+    if len(token) == 1 and token.isalpha():
+        return str(ord(token.upper()) - ord("A") + 1)
+    return token.upper()
+
+
+@dataclass
+class FileEntry:
+    source: str        # "Source" (priority) or "Target"
+    remote: str        # the rclone remote:path root supplied
+    path: str          # relative path within remote
+    size: int
+    mod_time: str
+    jav_id: str        # normalized, e.g. "SSIS-1"
+
+    @property
+    def full_path(self) -> str:
+        sep = "" if self.remote.endswith("/") or not self.path else "/"
+        return f"{self.remote}{sep}{self.path}"
+
+
+
+def human_size(n: int) -> str:
+    nf = float(max(0, n))
+    for unit in ("B", "KiB", "MiB", "GiB", "TiB"):
+        if nf < 1024:
+            return f"{int(nf)} B" if unit == "B" else f"{nf:.2f} {unit}"
+        nf /= 1024
+    return f"{nf:.2f} PiB"
+
+
+# Matches a trailing lowercase letter variant designator, e.g. the 'z' in IBW-902z.
+_VARIANT_SUFFIX_RE = re.compile(r"^(.+?)([a-z])$")
+
+# Strips `[resolution]` and ` - Actress Name` from a stem so that part-suffix
+# patterns anchored at `$` fire correctly.
+# Canonical naming: {ID}[-{part}][ - {actress}][ [{resolution}]]
+_RESOLUTION_TAG_RE = re.compile(r"\s*\[[^\]]*\]\s*$")
+
+# Bracket-wrapped ID: [REAL-779] or [HODV-21076] Saki Hatsumi [1080p]
+_BRACKET_ID_RE = re.compile(r"^\[([^\]]+)\]")
+_RES_LABEL_RE = re.compile(r"\[(?:2160|1080|720|480)p\]", re.IGNORECASE)
+_VIDEO_EXTS = {
+    ".avi", ".flv", ".m2ts", ".m4v", ".mkv", ".mov", ".mp4", ".mpeg",
+    ".mpg", ".ts", ".webm", ".wmv",
+}
+_LOWEST_KEEP_PRIORITY_EXTS = {".ts"}
+
+# No-hyphen ID fallback: MVSD312 → MVSD-312 (letters-only prefix + digits, no hyphen)
+_NOHYPHEN_ID_RE = re.compile(r"^([A-Za-z]{2,8})(\d{3,6})")
+
+
+def _clean_stem_for_parts(stem: str) -> str:
+    """Return stem with trailing [tag] and ' - Actress' stripped.
+    Resolution is always the last bracketed token; actress follows ' - '."""
+    s = _RESOLUTION_TAG_RE.sub("", stem).strip()
+    if " - " in s:
+        s = s[:s.index(" - ")].strip()
+    return s
+
+
+def _part_detection_stems(stem: str) -> list[str]:
+    """Return stem stages for part detection from least to most cleaned."""
+    resolution_clean = _RESOLUTION_TAG_RE.sub("", stem).strip()
+    actress_clean = _clean_stem_for_parts(stem)
+    out: list[str] = []
+    for candidate in (stem, resolution_clean, actress_clean):
+        if candidate and candidate not in out:
+            out.append(candidate)
+    return out
+
+
+def detect_part_from_stem(stem: str) -> str | None:
+    """Try part suffix rules before and after metadata cleanup."""
+    for candidate in _part_detection_stems(stem):
+        part = detect_part(candidate)
+        if part:
+            return part
+    return None
+
+
+def extract_id(name: str) -> str | None:
+    stem = Path(name).stem
+
+    # Strip bracket wrapper: [REAL-779] → REAL-779, [SCOP-297] [1080p] → SCOP-297
+    effective_stem = stem
+    if stem.startswith("["):
+        bm = _BRACKET_ID_RE.match(stem)
+        if bm:
+            effective_stem = bm.group(1).strip()
+
+    m = PRIMARY_ID_RE.match(effective_stem)
+    if not m:
+        m = COMPOUND_ID_RE.match(effective_stem)
+    if not m:
+        m = FALLBACK_ID_RE.match(effective_stem)
+    if not m:
+        # No-hyphen fallback: MVSD312 → MVSD-312
+        m = _NOHYPHEN_ID_RE.match(effective_stem)
+    if not m:
+        return None
+
+    num = int(m.group(2))
+    width = max(3, len(m.group(2)))
+    prefix = m.group(1).upper()
+    if prefix == "FC2":
+        prefix = "FC2-PPV"
+
+    # Check the character immediately after the matched digits.
+    # Lowercase → variant designator (e.g. IBW-902z): fold into the base ID.
+    # Uppercase A-D → part letter: handled below by detect_part.
+    # Anything else (space, '[', end-of-string) → no variant.
+    after = effective_stem[m.end():m.end() + 1]
+    variant = after if after.islower() else ""
+
+    base = f"{prefix}-{num:0{width}d}{variant}"
+
+    # Use original stem (not effective_stem) so bracket-wrapped filenames like
+    # [REAL-779-1].mp4 still get part detection applied to the full stem.
+    # Run before and after metadata cleanup: raw suffixes such as
+    # "KV-118 - Actress_PART1" must survive, while trailing [1080p] tags still
+    # need cleanup before end-anchored detectors can match.
+    part = detect_part_from_stem(stem)
+    return f"{base}#part{part_key(part)}" if part else base
+
+
+def normalize_id(raw: str) -> str | None:
+    return extract_id(raw + ".x")  # add dummy ext so stem keeps the ID intact
+
+
+def describe_id_match(display_query: str, matched_query: str, matched_id: str,
+                      expansion_count: int) -> dict[str, str]:
+    """Explain the matcher path used for one ID hit in JSON output."""
+    if "*" in matched_query or "?" in matched_query:
+        kind, label, confidence = "wildcard", "Wildcard ID", "broad"
+    elif expansion_count > 1:
+        kind, label, confidence = "range", "Range member", "expanded"
+    elif "#part" in matched_query:
+        kind, label, confidence = "exact_part", "Exact part ID", "high"
+    elif matched_id.startswith(matched_query + "#part"):
+        kind, label, confidence = "part", "Base ID + part", "related"
+    elif display_query.upper() != matched_query.upper():
+        kind, label, confidence = "normalized", "Normalized ID", "normalized"
+    else:
+        kind, label, confidence = "exact", "Exact ID", "high"
+    return {
+        "match_kind": kind,
+        "match_reason": label,
+        "match_confidence": confidence,
+        "matched_query": matched_query,
+        "matched_id": matched_id,
+    }
+
+
+def expand_range(raw: str) -> list[str] | None:
+    """Expand a bracket range like 'IPZZ-[820-860]' into individual ID strings.
+    Returns None if no range marker present."""
+    m = RANGE_RE.search(raw)
+    if not m:
+        return None
+    a, b = int(m.group(1)), int(m.group(2))
+    lo, hi = (a, b) if a <= b else (b, a)
+    width = max(len(m.group(1)), len(m.group(2)))  # preserve zero-padding
+    return [raw[:m.start()] + f"{n:0{width}d}" + raw[m.end():] for n in range(lo, hi + 1)]
+
+
+RCLONE_BIN = "rclone"
+BASIC = False  # set by --basic
+USE_ANSI = True  # disabled by --no-color
+
+# Pre-rich ANSI codes (used in --basic mode for color).
+ANSI_RESET = "\033[0m"
+ANSI_GREEN = "\033[32m"
+ANSI_RED = "\033[31m"
+ANSI_YELLOW = "\033[33m"
+ANSI_CYAN = "\033[36m"
+ANSI_DIM = "\033[2m"
+ANSI_BOLD = "\033[1m"
+
+
+def ansi(s: str, code: str) -> str:
+    return f"{code}{s}{ANSI_RESET}" if USE_ANSI else s
+console = Console()  # replaced in main() if --no-color
+
+
+_RICH_TAG_RE = re.compile(r"\[/?[^\]]*\]")
+
+
+def strip_markup(s: str) -> str:
+    return _RICH_TAG_RE.sub("", s)
+
+
+class BasicProgress:
+    """Minimal stand-in for rich.Progress used when --basic is set."""
+    def __init__(self):
+        self._tasks: dict[int, dict] = {}
+        self._next = 0
+        self._last_print: dict[int, int] = {}
+
+    def __enter__(self):
+        return self
+
+    def __exit__(self, *exc):
+        for tid, t in self._tasks.items():
+            sys.stderr.write(f"{ansi('[done]', ANSI_GREEN)} {t['desc']}  {t['done']}/{t['total']}\n")
+        return False
+
+    def add_task(self, description: str, total: int = 1) -> int:
+        tid = self._next
+        self._next += 1
+        desc = strip_markup(description)
+        self._tasks[tid] = {"desc": desc, "total": total, "done": 0}
+        self._last_print[tid] = 0
+        sys.stderr.write(f"{ansi('[start]', ANSI_CYAN)} {desc}\n")
+        return tid
+
+    def update(self, tid, total=None, description=None, **_):
+        t = self._tasks[tid]
+        if total is not None:
+            t["total"] = total
+        if description is not None:
+            t["desc"] = strip_markup(description)
+
+    def advance(self, tid, n: int = 1):
+        t = self._tasks[tid]
+        t["done"] += n
+        # In-place refresh every 5 files (or every file if total small).
+        step = 5 if t["total"] > 50 else 1
+        if t["done"] - self._last_print[tid] >= step or t["done"] == t["total"]:
+            counter = ansi(f"{t['done']}/{t['total']}", ANSI_CYAN)
+            line = f"  {counter}  {ansi(t['desc'], ANSI_DIM)}"
+            if sys.stderr.isatty():
+                sys.stderr.write(f"\r\033[K{line}")
+                if t["done"] == t["total"]:
+                    sys.stderr.write("\n")
+                sys.stderr.flush()
+            elif t["done"] == t["total"]:
+                # Non-TTY: only print final line, skip intermediate noise.
+                sys.stderr.write(line + "\n")
+            self._last_print[tid] = t["done"]
+
+# Default remotes used when --search is invoked without explicit --source/--target.
+DEFAULT_SOURCE = ["cq:personal-files/ClearJAV"]
+DEFAULT_TARGET = ["cq:personal-files/JAV/TMP"]
+
+# Default WinCatalog export folder (or specific files). Folder entries auto-discover *.csv / *.xml.
+DEFAULT_CATALOG: list[str] = [str(Path(__file__).resolve().parent / "wincatalog")]
+
+# CSV column synonyms (lowercased) — first matching one wins.
+CATALOG_COL_NAME = ("name", "file name", "filename", "title")
+CATALOG_COL_PATH = ("path", "full path", "location", "folder")
+CATALOG_COL_SIZE = ("size", "file size", "bytes", "size (bytes)")
+CATALOG_COL_DISC = ("disc", "disc name", "disc label", "volume", "source", "catalog", "media")
+
+CACHE_PATH = Path(__file__).resolve().parent / "cache.json"
+CACHE_VERSION = 3  # bumped: extract_id handles bracket-wrapped IDs + no-hyphen fallback
+CACHE_STALE_HOURS = 24
+
+DEFAULT_KEEP_RANKING: dict = {
+    "priority_folders": ["ClearJAV"],
+    "size_tolerance_mib": 0,
+    "format_preference": ["mkv", "mp4", "wmv", "avi"],
+    "tiebreak_res_tag": True,
+    "tiebreak_longer_name": True,
+}
+# Module-level ranking config; set from config.json in main() so all call sites pick it up.
+_KEEP_RANKING: dict = {}
+
+CONFIG_PATH = Path(__file__).resolve().parent / "config.json"
+
+# Written by the native-messaging host when the user clicks Cancel in the
+# extension popup. walk_remote checks for it every CANCEL_CHECK_INTERVAL files
+# and exits cleanly if found.
+CANCEL_FLAG = Path(__file__).resolve().parent / "scan-cancel.flag"
+CANCEL_CHECK_INTERVAL = 100   # check / emit progress every N files
+
+
+def load_config() -> dict:
+    if not CONFIG_PATH.exists():
+        return {}
+    try:
+        data = json.loads(CONFIG_PATH.read_text(encoding="utf-8"))
+        if not isinstance(data, dict):
+            return {}
+        return data
+    except (json.JSONDecodeError, OSError):
+        return {}
+
+
+def save_config(cfg: dict) -> None:
+    tmp = CONFIG_PATH.with_suffix(CONFIG_PATH.suffix + ".tmp")
+    tmp.write_text(json.dumps(cfg, indent=2), encoding="utf-8")
+    os.replace(tmp, CONFIG_PATH)
+
+
+def load_cache() -> dict:
+    if not CACHE_PATH.exists():
+        return {"version": CACHE_VERSION, "remotes": {}}
+    try:
+        data = json.loads(CACHE_PATH.read_text(encoding="utf-8"))
+        if (
+            not isinstance(data, dict)
+            or data.get("version") != CACHE_VERSION
+            or not isinstance(data.get("remotes"), dict)
+        ):
+            if isinstance(data, dict) and "version" in data and data["version"] != CACHE_VERSION:
+                sys.stderr.write(
+                    f"[warn] cache version mismatch (got {data['version']}, "
+                    f"expected {CACHE_VERSION}); forcing full rescan.\n"
+                )
+            return {"version": CACHE_VERSION, "remotes": {}}
+        return data
+    except (json.JSONDecodeError, OSError):
+        return {"version": CACHE_VERSION, "remotes": {}}
+
+
+def save_cache(cache: dict) -> None:
+    # Write to a sibling tmp file then atomically replace, so a killed mid-write
+    # (Ctrl-C, power loss, concurrent --scan) can't leave a half-written
+    # cache.json — load_cache would otherwise see invalid JSON and fall back to
+    # an empty cache, forcing a full re-scan.
+    tmp = CACHE_PATH.with_suffix(CACHE_PATH.suffix + ".tmp")
+    tmp.write_text(json.dumps(cache, indent=2), encoding="utf-8")
+    try:
+        os.replace(tmp, CACHE_PATH)
+    except PermissionError:
+        # Windows: destination may be briefly locked by antivirus or a concurrent reader.
+        time.sleep(0.5)
+        os.replace(tmp, CACHE_PATH)
+
+
+def cache_age_hours(scanned_at: str) -> float | None:
+    try:
+        dt = datetime.fromisoformat(scanned_at.replace("Z", "+00:00"))
+    except ValueError:
+        return None
+    now = datetime.now(dt.tzinfo) if dt.tzinfo else datetime.now()
+    return (now - dt).total_seconds() / 3600.0
+
+
+def fmt_age(hours: float) -> str:
+    if hours < 1:
+        return f"{int(hours * 60)}m"
+    if hours < 24:
+        return f"{hours:.1f}h"
+    return f"{hours / 24:.1f}d"
+
+
+# ---------- WinCatalog ingest ----------
+
+def _pick_col(headers_lower: list[str], synonyms: tuple[str, ...]) -> str | None:
+    for s in synonyms:
+        if s in headers_lower:
+            return s
+    return None
+
+
+def normalize_catalog_path(path: str) -> str:
+    """Keep catalog paths display-compatible with rclone-style path consumers."""
+    p = (path or "").replace("\\", "/")
+    if p.startswith("//"):
+        return "//" + re.sub(r"/+", "/", p[2:])
+    return re.sub(r"/+", "/", p)
+
+
+def load_catalog_csv(path: Path, skipped: list[tuple[str, str]]) -> list[FileEntry]:
+    """Load a WinCatalog CSV export. Lenient about column names."""
+    entries: list[FileEntry] = []
+    with path.open("r", encoding="utf-8-sig", newline="") as f:
+        # Sniff delimiter
+        sample = f.read(4096)
+        f.seek(0)
+        try:
+            dialect = csv.Sniffer().sniff(sample, delimiters=",;\t|")
+        except csv.Error:
+            dialect = csv.excel
+        reader = csv.DictReader(f, dialect=dialect)
+        if not reader.fieldnames:
+            return entries
+        headers: dict[str, str] = {}
+        for h in reader.fieldnames:
+            hl = h.lower()
+            if hl not in headers:
+                headers[hl] = h
+        col_name = _pick_col(list(headers), CATALOG_COL_NAME)
+        col_path = _pick_col(list(headers), CATALOG_COL_PATH)
+        col_size = _pick_col(list(headers), CATALOG_COL_SIZE)
+        col_disc = _pick_col(list(headers), CATALOG_COL_DISC)
+        if not col_name and not col_path:
+            console.print(f"[yellow]WARN: catalog CSV {path} has no Name/Path columns; skipping.[/]")
+            return entries
+        for row in reader:
+            name = (row.get(headers[col_name]) if col_name else "") or ""
+            full_path = (row.get(headers[col_path]) if col_path else "") or ""
+            if not name and full_path:
+                name = Path(full_path).name
+            full_path = normalize_catalog_path(full_path)
+            if not name:
+                continue
+            jav_id = extract_id(name)
+            if not jav_id:
+                skipped.append((f"catalog:{path.name}", full_path or name))
+                continue
+            try:
+                size = int(row.get(headers[col_size], 0)) if col_size else 0
+            except (ValueError, TypeError):
+                size = 0
+            disc = (row.get(headers[col_disc]) if col_disc else "") or ""
+            # Encode disc label into "remote" so it surfaces in output.
+            remote_label = f"catalog:{disc}" if disc else f"catalog:{path.name}"
+            entries.append(FileEntry(
+                source="Catalog", remote=remote_label,
+                path=full_path or name, size=size, mod_time="",
+                jav_id=jav_id,
+            ))
+    return entries
+
+
+def _strip_xml_ns(tag: str) -> str:
+    """Remove Clark-notation namespace {uri}local → local."""
+    return tag.split("}")[-1] if "}" in tag else tag
+
+
+def load_catalog_xml(path: Path, skipped: list[tuple[str, str]]) -> list[FileEntry]:
+    """Load a WinCatalog XML export. Walks for any element with file-like attrs."""
+    entries: list[FileEntry] = []
+    tree = ET.parse(str(path))
+    root = tree.getroot()
+
+    def walk(node, disc_label: str, parent_path: str, _depth: int = 0):
+        if _depth > 500:
+            return
+        tag = _strip_xml_ns(node.tag).lower()
+        # Heuristics: disc/catalog/source containers reset disc_label
+        if tag in ("disc", "catalog", "source", "volume", "media"):
+            disc_label = node.get("name") or node.get("Name") or disc_label
+        # File-like nodes
+        if tag in ("file", "f"):
+            name = node.get("name") or node.get("Name") or node.findtext("Name") or ""
+            size_raw = node.get("size") or node.get("Size") or node.findtext("Size") or "0"
+            try:
+                size = int(size_raw)
+            except ValueError:
+                size = 0
+            full_path = normalize_catalog_path(f"{parent_path}/{name}" if parent_path else name)
+            jav_id = extract_id(name)
+            if jav_id:
+                entries.append(FileEntry(
+                    source="Catalog",
+                    remote=f"catalog:{disc_label}" if disc_label else f"catalog:{path.name}",
+                    path=full_path, size=size, mod_time="", jav_id=jav_id,
+                ))
+            else:
+                skipped.append((f"catalog:{disc_label or path.name}", full_path))
+            return
+        # Folder-like: extend parent_path
+        if tag in ("folder", "dir", "directory"):
+            folder_name = node.get("name") or node.get("Name") or ""
+            parent_path = normalize_catalog_path(f"{parent_path}/{folder_name}" if parent_path else folder_name)
+        for child in node:
+            walk(child, disc_label, parent_path, _depth + 1)
+
+    walk(root, "", "")
+    return entries
+
+
+def _expand_catalog_paths(paths: list[str]) -> list[Path]:
+    """Expand any directories to their *.csv / *.xml children. Files passed through."""
+    out: list[Path] = []
+    for p in paths:
+        cp = Path(p)
+        if cp.is_dir():
+            for child in sorted(cp.iterdir()):
+                if child.suffix.lower() in (".csv", ".xml") and child.is_file():
+                    out.append(child)
+        elif cp.exists():
+            out.append(cp)
+        # silently skip missing default dir; warn for everything else
+        elif Path(p).resolve() not in {Path(d).resolve() for d in DEFAULT_CATALOG}:
+            console.print(f"[yellow]WARN: catalog path not found: {p}[/]")
+    return out
+
+
+def load_catalogs(paths: list[str], skipped: list[tuple[str, str]]) -> list[FileEntry]:
+    out: list[FileEntry] = []
+    for cp in _expand_catalog_paths(paths):
+        ext = cp.suffix.lower()
+        if ext == ".csv":
+            out.extend(load_catalog_csv(cp, skipped))
+        elif ext == ".xml":
+            out.extend(load_catalog_xml(cp, skipped))
+        else:
+            console.print(f"[yellow]WARN: unknown catalog format '{ext}' for {cp}; skipping.[/]")
+    return out
+
+
+# ---------- quick search (no cache) ----------
+
+def quick_search_remote(remote: str, source_label: str,
+                        patterns: list[str],
+                        skipped: list[tuple[str, str]]) -> list[FileEntry]:
+    """Run `rclone lsjson --include <pattern>` once per pattern. Bypass cache."""
+    out: list[FileEntry] = []
+    seen: set[tuple[str, str]] = set()
+    for pat in patterns:
+        cmd = [RCLONE_BIN, "lsjson", remote, "--files-only", "-R", "--include", pat]
+        proc = subprocess.run(cmd, capture_output=True, text=True,
+                              encoding="utf-8", errors="replace")
+        if proc.returncode != 0:
+            console.print(f"[red]rclone lsjson --include failed for {remote}:[/]\n{proc.stderr}")
+            sys.exit(proc.returncode)
+        for item in json.loads(proc.stdout or "[]"):
+            if item.get("IsDir"):
+                continue
+            path = item["Path"]
+            key = (remote, path)
+            if key in seen:
+                continue
+            seen.add(key)
+            jav_id = extract_id(Path(path).name)
+            if not jav_id:
+                skipped.append((remote, path))
+                continue
+            out.append(FileEntry(
+                source=source_label, remote=remote, path=path,
+                size=int(item.get("Size", 0)),
+                mod_time=item.get("ModTime", ""), jav_id=jav_id,
+            ))
+    return out
+
+
+def choose_search_mode(raw_queries: list[str], force_quick: bool, force_cache: bool) -> tuple[str, str]:
+    """Decide quick vs cached. Returns (mode, reason)."""
+    if force_quick and force_cache:
+        return ("cached", "both --quick and --cache passed; preferring --cache (safer)")
+    if force_quick:
+        return ("quick", "forced via --quick")
+    if force_cache:
+        return ("cached", "forced via --cache")
+    if len(raw_queries) > 1:
+        return ("cached", f"multi-query ({len(raw_queries)} IDs) — cache batches them for free")
+    if not raw_queries:
+        return ("cached", "no queries")
+    q = raw_queries[0]
+    if RANGE_RE.search(q):
+        return ("cached", "range [N-M] — too many rclone calls otherwise")
+    if "*" in q or "?" in q:
+        return ("cached", "wildcard — cache match semantics are more reliable")
+    return ("quick", "single exact ID — live lookup is fastest")
+
+
+def _escape_rclone_glob(s: str) -> str:
+    """Escape rclone filter meta-chars so a literal token isn't interpreted as a
+    glob. rclone's filter syntax treats `*`, `?`, `[`, `{` specially; brackets
+    open a char-class that fails silently if the token contains `[` or `]`."""
+    out = []
+    for ch in s:
+        if ch in r"*?[]{}\\":
+            out.append("\\" + ch)
+        else:
+            out.append(ch)
+    return "".join(out)
+
+
+def name_to_include_patterns(tokens: list[str]) -> list[str]:
+    """Build rclone --include globs for each name token (case-insensitive substring)."""
+    pats: list[str] = []
+    for t in tokens:
+        if "*" in t or "?" in t:
+            # Caller-supplied wildcard — assume they meant it.
+            pats.append(t)
+        else:
+            # Literal substring search: escape glob meta inside the token so
+            # `--name "[BD]"` searches for the literal "[BD]" not a char class.
+            pats.append(f"*{_escape_rclone_glob(t)}*")
+    return pats
+
+
+def name_match(stem: str, tokens: list[str]) -> bool:
+    """Case-insensitive: True if ANY token matches stem (substring or fnmatch glob)."""
+    low = stem.lower()
+    for t in tokens:
+        tl = t.lower()
+        if "*" in tl or "?" in tl:
+            if fnmatch.fnmatchcase(low, tl):
+                return True
+        elif tl in low:
+            return True
+    return False
+
+
+def query_to_include_patterns(raw: str) -> list[str]:
+    """Turn a search query into one or more rclone --include globs.
+    Ranges expand to individual IDs; wildcards and exact IDs map to single glob."""
+    if RANGE_RE.search(raw):
+        expanded = expand_range(raw) or []
+        out: list[str] = []
+        for e in expanded:
+            out.extend(query_to_include_patterns(e))
+        return out
+    if "*" in raw or "?" in raw:
+        return [f"{raw}*"]
+    norm = normalize_id(raw)
+    if not norm:
+        return [f"{raw}*"]
+    prefix, _, digits = norm.rpartition("-")
+    if not digits.isdigit():
+        return [f"{norm}*"]
+    n = int(digits)
+    width = max(3, len(str(n)))
+    return [f"{prefix}-{n:0{width}d}*"]
+
+
+# ---------- rclone wrappers ----------
+
+def remote_file_count(remote: str) -> int:
+    """Fast total file count via `rclone size --json`."""
+    cmd = [RCLONE_BIN, "size", "--json", remote]
+    proc = subprocess.run(cmd, capture_output=True, text=True,
+                          encoding="utf-8", errors="replace")
+    if proc.returncode != 0:
+        console.print(f"[red]rclone size failed for {remote}:[/]\n{proc.stderr}")
+        sys.exit(proc.returncode)
+    try:
+        return int(json.loads(proc.stdout).get("count", 0))
+    except (json.JSONDecodeError, ValueError):
+        return 0
+
+
+DURATION_RE = re.compile(r"^\s*(\d+)\s*([smhd])\s*$", re.IGNORECASE)
+
+
+def parse_duration(s: str) -> str | None:
+    """Validate a duration suffix (`30m`, `24h`, `7d`, `90s`). Returns the
+    normalized form rclone accepts, or None if invalid. We don't compute a
+    timedelta — we pass the suffix straight to rclone --max-age."""
+    if not s:
+        return None
+    m = DURATION_RE.match(s)
+    if not m:
+        return None
+    return f"{m.group(1)}{m.group(2).lower()}"
+
+
+def walk_remote(remote: str, source_label: str,
+                skipped: list[tuple[str, str]],
+                progress: Progress, task_id,
+                max_age: str | None = None,
+                _total_override: int | None = None) -> tuple[list[FileEntry], list[str]]:
+    """Stream files from rclone lsf, ticking progress per file.
+    If max_age is set, pass --max-age to rclone so only recently-modified files
+    are returned (incremental scan).
+    _total_override: skip the internal remote_file_count probe (caller already did it)."""
+    if max_age:
+        # Can't pre-count for an age-filtered walk — skip the size probe and
+        # let progress run on a synthetic total.
+        total = 0
+        progress.update(task_id, total=1,
+                        description=f"[cyan]{source_label}[/] {remote} (since {max_age})")
+    else:
+        if _total_override is not None:
+            total = _total_override
+        else:
+            total = remote_file_count(remote)
+            if BASIC:
+                # Caller already emitted SCAN_REMOTE_START (without total) — now we know it.
+                sys.stderr.write("SCAN_REMOTE_COUNTED " + json.dumps({
+                    "remote": remote, "total": total,
+                }) + "\n")
+                sys.stderr.flush()
+        progress.update(task_id, total=max(total, 1),
+                        description=f"[cyan]{source_label}[/] {remote}")
+    cmd = [RCLONE_BIN, "lsf", "--files-only", "-R",
+           "--format", "pst", "--separator", "\t"]
+    if max_age:
+        cmd += ["--max-age", max_age]
+    cmd.append(remote)
+    proc = subprocess.Popen(cmd, stdout=subprocess.PIPE, stderr=subprocess.PIPE,
+                            text=True, encoding="utf-8", errors="replace")
+    entries: list[FileEntry] = []
+    local_skipped: list[str] = []
+    if proc.stdout is None:
+        raise RuntimeError("rclone stdout pipe unexpectedly None")
+    _stderr_chunks: list[str] = []
+    _stderr_thread = threading.Thread(
+        target=lambda: _stderr_chunks.append(proc.stderr.read() if proc.stderr else ""),
+        daemon=True,
+    )
+    _stderr_thread.start()
+    _cancelled = False
+    try:
+        for line in proc.stdout:
+            line = line.rstrip("\n").rstrip("\r")
+            if not line:
+                continue
+            parts = line.split("\t")
+            if len(parts) < 2:
+                continue
+            rel = parts[0]
+            try:
+                size = int(parts[1])
+            except ValueError:
+                size = 0
+            mod_time = parts[2] if len(parts) >= 3 else ""
+            jav_id = extract_id(Path(rel).name)
+            if not jav_id:
+                local_skipped.append(rel)
+                skipped.append((remote, rel))
+            else:
+                entries.append(FileEntry(
+                    source=source_label, remote=remote, path=rel,
+                    size=size, mod_time=mod_time, jav_id=jav_id,
+                ))
+            progress.advance(task_id)
+            # Every CANCEL_CHECK_INTERVAL files: check cancel flag and emit progress.
+            n = len(entries) + len(local_skipped)
+            if BASIC and n > 0 and n % CANCEL_CHECK_INTERVAL == 0:
+                if CANCEL_FLAG.exists():
+                    try:
+                        CANCEL_FLAG.unlink(missing_ok=True)
+                    except OSError:
+                        pass
+                    proc.terminate()
+                    try:
+                        proc.wait(timeout=3)
+                    except subprocess.TimeoutExpired:
+                        proc.kill()
+                    _cancelled = True
+                    break
+                sys.stderr.write("SCAN_FILE_PROGRESS " + json.dumps({
+                    "remote": remote, "label": source_label,
+                    "files": len(entries), "skipped": len(local_skipped),
+                    "total": total,
+                }) + "\n")
+                sys.stderr.flush()
+    except KeyboardInterrupt:
+        proc.terminate()
+        try:
+            proc.wait(timeout=3)
+        except subprocess.TimeoutExpired:
+            proc.kill()
+        raise
+    if _cancelled:
+        sys.stderr.write("SCAN_CANCELLED\n")
+        sys.stderr.flush()
+        sys.exit(0)
+    proc.wait()
+    _stderr_thread.join()
+    if proc.returncode != 0:
+        err = _stderr_chunks[0] if _stderr_chunks else ""
+        console.print(f"[red]rclone lsf failed for {remote}:[/]\n{err}")
+        sys.exit(proc.returncode)
+    return entries, local_skipped
+
+
+def make_progress():
+    if BASIC:
+        return BasicProgress()
+    return Progress(
+        SpinnerColumn(),
+        TextColumn("{task.description}"),
+        BarColumn(),
+        MofNCompleteColumn(),
+        TimeElapsedColumn(),
+        TextColumn("eta"),
+        TimeRemainingColumn(),
+        console=console,
+        transient=False,
+    )
+
+
+# ---------- collectors ----------
+
+def collect_with_progress(remotes_by_label: list[tuple[str, str]],
+                          skipped: list[tuple[str, str]]
+                          ) -> list[FileEntry]:
+    """Dupe-mode collect — every remote freshly walked with progress."""
+    out: list[FileEntry] = []
+    if not remotes_by_label:
+        return out
+    with make_progress() as progress:
+        tasks = {(label, r): progress.add_task(f"{label} {r}", total=1)
+                 for label, r in remotes_by_label}
+        for (label, r), tid in tasks.items():
+            entries, _ = walk_remote(r, label, skipped, progress, tid)
+            out.extend(entries)
+    return out
+
+
+def cached_collect(remotes: list[str], source_label: str,
+                   skipped: list[tuple[str, str]],
+                   cache: dict, use_cache: bool, force_update: bool,
+                   cache_meta: dict[str, dict],
+                   scan_since: str | None = None) -> list[FileEntry]:
+    """Search-mode collect with cache. Always recursive.
+    scan_since: rclone duration string (`24h`, `7d`). When set during a forced
+    update, only files modified within the window are walked and merged on top
+    of the existing cache entry; files older than the window keep their cached
+    record. If there's no prior cache entry for a remote, falls through to a
+    full scan."""
+    out: list[FileEntry] = []
+    to_scan: list[str] = []
+    to_incremental: list[tuple[str, dict]] = []  # (remote, existing_entry)
+    for r in remotes:
+        if scan_since and force_update and use_cache:
+            existing = cache["remotes"].get(r)
+            if existing:
+                to_incremental.append((r, existing))
+                continue
+            # No prior cache for this remote -> can't be incremental, fall back.
+        entry = cache["remotes"].get(r) if use_cache and not force_update else None
+        if entry:
+            age = cache_age_hours(entry["scanned_at"])
+            age_str = fmt_age(age) if age is not None else "?"
+            stale = age is not None and age > CACHE_STALE_HOURS
+            cache_meta[r] = {"cached": True, "age": age_str, "stale": stale,
+                             "file_count": len(entry["files"])}
+            for f in entry["files"]:
+                out.append(FileEntry(source=source_label, remote=r, path=f["path"],
+                                     size=f["size"], mod_time=f.get("mod_time", ""),
+                                     jav_id=f["jav_id"]))
+            for s in entry.get("skipped", []):
+                skipped.append((r, s))
+        else:
+            to_scan.append(r)
+
+    if to_scan:
+        with make_progress() as progress:
+            tids = {r: progress.add_task(f"{source_label} {r}", total=1) for r in to_scan}
+            for r_idx, r in enumerate(to_scan):
+                _total: int | None = None
+                if BASIC:
+                    # Emit SCAN_REMOTE_START immediately so the UI shows the remote name.
+                    # Then probe the file count; once known, emit SCAN_REMOTE_COUNTED so
+                    # the UI can show "N / total" without waiting for the first 100 files.
+                    sys.stderr.write("SCAN_REMOTE_START " + json.dumps({
+                        "remote": r, "label": source_label,
+                        "index": r_idx + 1, "of": len(to_scan),
+                        "total": None,
+                    }) + "\n")
+                    sys.stderr.flush()
+                    _total = remote_file_count(r)
+                    sys.stderr.write("SCAN_REMOTE_COUNTED " + json.dumps({
+                        "remote": r, "total": _total,
+                    }) + "\n")
+                    sys.stderr.flush()
+                fresh, local_skipped = walk_remote(r, source_label, skipped, progress, tids[r],
+                                                   _total_override=_total)
+                out.extend(fresh)
+                cache_meta[r] = {"cached": False, "age": "fresh", "stale": False,
+                                 "file_count": len(fresh)}
+                if use_cache:
+                    cache["remotes"][r] = {
+                        "scanned_at": datetime.now().astimezone().isoformat(),
+                        "recursive": True,
+                        "files": [{"path": e.path, "size": e.size, "mod_time": e.mod_time,
+                                   "jav_id": e.jav_id} for e in fresh],
+                        "skipped": local_skipped,
+                    }
+                if BASIC:
+                    sys.stderr.write("SCAN_PROGRESS " + json.dumps({
+                        "remote": r, "label": source_label,
+                        "files": len(fresh), "files_total": len(out),
+                    }) + "\n")
+                    sys.stderr.flush()
+
+    if to_incremental:
+        with make_progress() as progress:
+            tids = {r: progress.add_task(f"{source_label} {r} (since {scan_since})", total=1)
+                    for r, _ in to_incremental}
+            for r_idx, (r, existing) in enumerate(to_incremental):
+                if BASIC:
+                    sys.stderr.write("SCAN_REMOTE_START " + json.dumps({
+                        "remote": r, "label": source_label,
+                        "index": r_idx + 1, "of": len(to_incremental),
+                        "total": None, "incremental": True,
+                    }) + "\n")
+                    sys.stderr.flush()
+                fresh, local_skipped = walk_remote(
+                    r, source_label, skipped, progress, tids[r], max_age=scan_since,
+                )
+                # Merge: replace entries at paths we just walked, keep all others.
+                new_paths = {e.path for e in fresh}
+                old_files = [f for f in existing.get("files", [])
+                             if f["path"] not in new_paths]
+                merged_files = old_files + [
+                    {"path": e.path, "size": e.size, "mod_time": e.mod_time,
+                     "jav_id": e.jav_id} for e in fresh
+                ]
+                # Merge skipped lists (de-dupe).
+                old_skipped = set(existing.get("skipped", []))
+                old_skipped.update(local_skipped)
+                # Emit FileEntry for everything (old + new) so the caller sees the
+                # full set, not just deltas.
+                for f in merged_files:
+                    out.append(FileEntry(source=source_label, remote=r, path=f["path"],
+                                         size=f["size"], mod_time=f.get("mod_time", ""),
+                                         jav_id=f["jav_id"]))
+                for s in old_skipped:
+                    skipped.append((r, s))
+                cache_meta[r] = {
+                    "cached": False, "age": f"incremental {scan_since}",
+                    "stale": False, "file_count": len(merged_files),
+                    "added_or_updated": len(fresh),
+                }
+                if use_cache:
+                    cache["remotes"][r] = {
+                        "scanned_at": datetime.now().astimezone().isoformat(),
+                        "recursive": True,
+                        "files": merged_files,
+                        "skipped": sorted(old_skipped),
+                    }
+                if BASIC:
+                    sys.stderr.write("SCAN_PROGRESS " + json.dumps({
+                        "remote": r, "label": source_label,
+                        "files": len(fresh), "files_total": len(out),
+                        "incremental": True,
+                        "file_count": len(merged_files),
+                    }) + "\n")
+                    sys.stderr.flush()
+    return out
+
+
+# ---------- renderers ----------
+
+def render_banner(cache_meta: dict[str, dict], mode: str) -> Panel:
+    lines: list[Text] = []
+    lines.append(Text.from_markup(f"[bold]mode:[/] {mode}"))
+    if cache_meta:
+        for r, m in cache_meta.items():
+            if m["cached"]:
+                tag = f"CACHED {m['age']}" + (" STALE" if m["stale"] else "")
+                style = "yellow" if m["stale"] else "dim"
+            else:
+                tag = "FRESH SCAN"
+                style = "green"
+            lines.append(Text.from_markup(
+                f"  [white]{r}[/]  [{style}]{tag}[/]  [dim]({m['file_count']} files)[/]"
+            ))
+    body = Text("\n").join(lines)
+    return Panel(body, title="rc-jav", title_align="left", border_style="blue")
+
+
+def render_search(matches: dict[str, list[FileEntry]], queries: list[str],
+                  cache_meta: dict[str, dict]) -> None:
+    console.print(render_banner(cache_meta, mode="search"))
+    for q in queries:
+        hits = matches.get(q, [])
+        if not hits:
+            console.print(f"[bold red][{q}] NOT FOUND[/]")
+            console.print()
+            continue
+        title = f"[bold green][{q}] {len(hits)} hit(s)[/]"
+        tbl = Table(title=title, title_justify="left", show_lines=False,
+                    border_style="green", expand=True)
+        tbl.add_column("Source", style="yellow", no_wrap=True)
+        tbl.add_column("Cache", no_wrap=True)
+        tbl.add_column("File", style="bold", overflow="fold")
+        tbl.add_column("Size", justify="right", no_wrap=True)
+        tbl.add_column("Path", style="dim", overflow="fold")
+        for e in sorted(hits, key=lambda x: (x.jav_id, x.path.lower())):
+            meta = cache_meta.get(e.remote, {})
+            if meta.get("cached"):
+                cache_tag = "[yellow][CACHED-STALE][/]" if meta.get("stale") else "[dim][CACHED][/]"
+            else:
+                cache_tag = "[green][FRESH][/]"
+            tbl.add_row(
+                e.source, cache_tag, Path(e.path).name,
+                f"{human_size(e.size)}\n[dim]({e.size:,} B)[/]",
+                e.full_path,
+            )
+        console.print(tbl)
+        console.print()
+
+
+def render_name_matches(hits: list[FileEntry], tokens: list[str],
+                        cache_meta: dict[str, dict]) -> None:
+    title = f"[bold green]Name match {tokens} — {len(hits)} hit(s)[/]"
+    if not hits:
+        console.print(f"[bold red]Name match {tokens} — NOT FOUND[/]")
+        return
+    tbl = Table(title=title, title_justify="left", show_lines=False,
+                border_style="green", expand=True)
+    tbl.add_column("Source", style="yellow", no_wrap=True)
+    tbl.add_column("Cache", no_wrap=True)
+    tbl.add_column("ID", style="bold cyan", no_wrap=True)
+    tbl.add_column("File", style="bold", overflow="fold")
+    tbl.add_column("Size", justify="right", no_wrap=True)
+    tbl.add_column("Path", style="dim", overflow="fold")
+    for e in sorted(hits, key=lambda x: (x.jav_id, x.path.lower())):
+        meta = cache_meta.get(e.remote, {})
+        if meta.get("cached"):
+            cache_tag = "[yellow][CACHED-STALE][/]" if meta.get("stale") else "[dim][CACHED][/]"
+        else:
+            cache_tag = "[green][FRESH][/]"
+        tbl.add_row(
+            e.source, cache_tag, e.jav_id, Path(e.path).name,
+            f"{human_size(e.size)}\n[dim]({e.size:,} B)[/]",
+            e.full_path,
+        )
+    console.print(tbl)
+    console.print()
+
+
+def render_name_matches_plain(hits: list[FileEntry], tokens: list[str],
+                              cache_meta: dict[str, dict]) -> str:
+    lines: list[str] = []
+    if not hits:
+        lines.append(ansi(f"Name match {tokens} — NOT FOUND", ANSI_RED))
+        return "\n".join(lines)
+    lines.append(ansi(f"Name match {tokens} — {len(hits)} hit(s)", ANSI_GREEN + ANSI_BOLD))
+    for e in sorted(hits, key=lambda x: (x.jav_id, x.path.lower())):
+        meta = cache_meta.get(e.remote, {})
+        if meta.get("cached"):
+            tag = ansi("[CACHED-STALE]", ANSI_YELLOW) if meta.get("stale") else ansi("[CACHED]", ANSI_DIM)
+        else:
+            tag = ansi("[FRESH]", ANSI_GREEN)
+        src = ansi(e.source, ANSI_YELLOW)
+        lines.append(f"  {src}  {tag}  {ansi(e.jav_id, ANSI_CYAN)}")
+        lines.append(ansi(f"    file: {Path(e.path).name}", ANSI_BOLD))
+        lines.append(f"    size: {human_size(e.size)} ({e.size:,} bytes)")
+        lines.append(ansi(f"    path: {e.full_path}", ANSI_DIM))
+    return "\n".join(lines)
+
+
+def render_dupes(dupes: dict[str, list[FileEntry]],
+                 skipped: list[tuple[str, str]],
+                 variant_alerts: dict[str, list[FileEntry]] | None = None) -> None:
+    if not dupes:
+        console.print(Panel("[bold green]No duplicates found.[/]",
+                            border_style="green"))
+    else:
+        console.print(f"[bold]Found {len(dupes)} duplicate ID group(s):[/]")
+        console.print()
+        total_reclaim = 0
+        for jav_id in sorted(dupes):
+            entries = dupes[jav_id]
+            keep = decide_keep(entries)
+            tbl = Table(title=f"[bold][{jav_id}][/]", title_justify="left",
+                        show_lines=False, border_style="magenta", expand=True)
+            tbl.add_column("Action", no_wrap=True)
+            tbl.add_column("Source", style="yellow", no_wrap=True)
+            tbl.add_column("Size", justify="right", no_wrap=True)
+            tbl.add_column("Path", overflow="fold")
+            for e in sorted(entries, key=lambda x: (x.source != "Source", x.source == "Catalog", -x.size)):
+                if e.source == "Catalog":
+                    action = "[cyan]CATALOG[/]"
+                elif e is keep:
+                    action = "[green]KEEP[/]"
+                else:
+                    action = "[red]DELETE?[/]"
+                    total_reclaim += e.size
+                tbl.add_row(action, e.source,
+                        f"{human_size(e.size)}\n[dim]({e.size:,} B)[/]",
+                        e.full_path)
+            console.print(tbl)
+            console.print()
+        console.print(Panel(
+            f"[bold]Potential space reclaim if all DELETE? removed: "
+            f"[red]{human_size(total_reclaim)}[/][/]",
+            border_style="red"))
+    if skipped:
+        console.print()
+        tbl = Table(title=f"[dim]Skipped {len(skipped)} file(s) with no parseable ID[/]",
+                    title_justify="left", show_lines=False, border_style="dim", expand=True)
+        tbl.add_column("Remote", style="dim", no_wrap=True)
+        tbl.add_column("Path", style="dim", overflow="fold")
+        for remote, path in skipped[:50]:
+            tbl.add_row(remote, path)
+        if len(skipped) > 50:
+            tbl.add_row("[dim]…[/]", f"[dim]+{len(skipped) - 50} more[/]")
+        console.print(tbl)
+    if variant_alerts:
+        console.print()
+        console.print(Panel(
+            f"[bold yellow]⚠ {len(variant_alerts)} variant alert(s) — manual review recommended[/]",
+            border_style="yellow"))
+        for bare_id, entries in sorted(variant_alerts.items()):
+            tbl = Table(title=f"[bold yellow][{bare_id}] — bare + variant coexist[/]",
+                        title_justify="left", show_lines=False, border_style="yellow", expand=True)
+            tbl.add_column("ID", style="yellow", no_wrap=True)
+            tbl.add_column("Size", justify="right", no_wrap=True)
+            tbl.add_column("Path", overflow="fold")
+            for e in sorted(entries, key=lambda x: x.full_path):
+                eid = extract_id(Path(e.path).name) or e.jav_id
+                tbl.add_row(eid, human_size(e.size), e.full_path)
+            console.print(tbl)
+            console.print()
+
+
+def decide_keep_with_reason(entries: list[FileEntry]) -> tuple[FileEntry, dict[str, str]]:
+    """Pick KEEP candidate and explain the first ranking rule that settled it.
+
+    Catalog entries are excluded — they are offline/informational.
+
+    Ranking (descending priority, configurable via keep_ranking in config.json):
+      1. Video files in ordered priority folders outrank other rclone entries.
+      2. Source entries outrank Target entries when no priority-folder video exists.
+      3. Non-.ts files outrank .ts files when a duplicate group has both.
+      4. Largest file size. If sizes are within size_tolerance_mib, treated as equal
+         and format preference is consulted instead.
+      5. Format preference: ordered list of extensions (e.g. mkv > mp4 > wmv > avi).
+      6. Tie-break: has resolution tag in filename ([1080p], [2160p], [720p], [480p]).
+      7. Tie-break: longer filename (more metadata = more descriptive).
+    """
+    ranking = _KEEP_RANKING or {}
+    tolerance_bytes = int(float(ranking.get("size_tolerance_mib") or 0) * 1024 * 1024)
+    priority_folders: list[str] = [
+        str(folder).strip() for folder in
+        (ranking.get("priority_folders") or DEFAULT_KEEP_RANKING["priority_folders"])
+        if str(folder).strip()
+    ]
+    fmt_order: list[str] = list(
+        ranking.get("format_preference") or DEFAULT_KEEP_RANKING["format_preference"]
+    )
+    use_res_tag: bool = ranking.get("tiebreak_res_tag", True)
+    use_longer_name: bool = ranking.get("tiebreak_longer_name", True)
+
+    rclone = [e for e in entries if e.source != "Catalog"]
+
+    def _priority_folder_rank(e: FileEntry) -> int | None:
+        if Path(e.path).suffix.lower() not in _VIDEO_EXTS:
+            return None
+        # A root can be cq:JAV while the favored folder is a child path, or the
+        # supplied root can itself end in that folder. Match across full_path.
+        full_path = e.full_path.replace("\\", "/").strip("/").lower()
+        segments = [segment for segment in full_path.split("/") if segment]
+        for index, raw_folder in enumerate(priority_folders):
+            folder = raw_folder.replace("\\", "/").strip("/").lower()
+            if not folder:
+                continue
+            if "/" in folder or ":" in folder:
+                framed = f"/{full_path}/"
+                if full_path == folder or full_path.startswith(folder + "/") or f"/{folder}/" in framed:
+                    return index
+            elif folder in segments:
+                return index
+        return None
+
+    prioritized = [(rank, e) for e in rclone if (rank := _priority_folder_rank(e)) is not None]
+    best_priority = min((rank for rank, _ in prioritized), default=None)
+    priority_videos = [e for rank, e in prioritized if rank == best_priority]
+    pool_priority = [e for e in rclone if e.source == "Source"]
+    reason = {"code": "fallback", "summary": "First remaining duplicate candidate"}
+    if priority_videos:
+        pool = priority_videos
+        reason = {
+            "code": "vip_folder",
+            "summary": f"VIP folder: {priority_folders[best_priority]}",
+        }
+    elif pool_priority:
+        pool = pool_priority
+        reason = {"code": "source", "summary": "Source copy outranks target copies"}
+    else:
+        pool = rclone if rclone else entries
+
+    # Transport streams often inflate size without being the better keeper.
+    preferred_containers = [
+        e for e in pool if Path(e.path).suffix.lower() not in _LOWEST_KEEP_PRIORITY_EXTS
+    ]
+    if preferred_containers and len(preferred_containers) != len(pool):
+        pool = preferred_containers
+        reason = {"code": "container", "summary": "Non-TS video outranks transport stream"}
+
+    # Step 1: narrow to within size tolerance of the maximum
+    max_size = max(e.size for e in pool)
+    candidates = [e for e in pool if max_size - e.size <= tolerance_bytes]
+
+    if len(candidates) == 1:
+        if len(pool) > 1 and reason["code"] not in {"vip_folder", "source", "container"}:
+            reason = {"code": "size", "summary": "Largest file after ranking rules"}
+        return candidates[0], reason
+
+    # Step 2: format preference (lower index in fmt_order = higher priority)
+    def _fmt_rank(e: FileEntry) -> int:
+        ext = Path(e.path).suffix.lower().lstrip(".")
+        try:
+            return fmt_order.index(ext)          # lower = better
+        except ValueError:
+            return len(fmt_order)                # unknown = lowest
+
+    best_fmt = min(_fmt_rank(e) for e in candidates)
+    by_fmt = [e for e in candidates if _fmt_rank(e) == best_fmt]
+    if len(by_fmt) != len(candidates):
+        ext = Path(by_fmt[0].path).suffix.lower().lstrip(".").upper() or "preferred format"
+        reason = {"code": "format", "summary": f"Format preference: {ext}"}
+    candidates = by_fmt
+
+    if len(candidates) == 1:
+        return candidates[0], reason
+
+    # Step 3: resolution tag tie-break
+    if use_res_tag:
+        tagged = [e for e in candidates if _RES_LABEL_RE.search(Path(e.path).name)]
+        if tagged:
+            if len(tagged) != len(candidates):
+                reason = {"code": "resolution_tag", "summary": "Filename has a resolution tag"}
+            candidates = tagged
+
+    if len(candidates) == 1:
+        return candidates[0], reason
+
+    # Step 4: longer filename tie-break
+    if use_longer_name:
+        keep = max(candidates, key=lambda e: len(Path(e.path).name))
+        return keep, {"code": "filename", "summary": "Longer filename tie-break"}
+
+    return candidates[0], reason
+
+
+def decide_keep(entries: list[FileEntry]) -> FileEntry:
+    """Pick KEEP candidate for duplicate output."""
+    return decide_keep_with_reason(entries)[0]
+
+
+def find_dupes(entries: Iterable[FileEntry]) -> dict[str, list[FileEntry]]:
+    """Group entries by jav_id. A group is a dupe only if it has >=2 non-Catalog entries."""
+    groups: dict[str, list[FileEntry]] = {}
+    for e in entries:
+        # Re-evaluate duplicate keys from the current filename rules. Cached
+        # entries may predate a new part detector such as `.1of2`; treating those
+        # stale base IDs as duplicate files would produce risky delete hints.
+        key = extract_id(Path(e.path).name) or e.jav_id
+        groups.setdefault(key, []).append(e)
+    out: dict[str, list[FileEntry]] = {}
+    for k, v in groups.items():
+        rclone_count = sum(1 for e in v if e.source != "Catalog")
+        if rclone_count >= 2:
+            out[k] = v
+    return out
+
+
+_SUSPICIOUS_MULTIPART_TAIL_RE = re.compile(
+    r"(?:^|[-_.\s])(?:p|pt|part|cd|disc|ep|episode|vol|volume|scene)[-_.\s]*([a-d]|\d{1,2})(?:$|[-_.\s\[])"
+    r"|(?:^|[-_.\s])([a-d]|\d{1,2})(?:$|\s*\[)",
+    re.IGNORECASE,
+)
+
+
+def describe_dupe_risks(jav_id: str, entries: list[FileEntry]) -> list[dict[str, str]]:
+    """Flag duplicate groups that deserve manual review before deletion."""
+    rclone = [e for e in entries if e.source != "Catalog"]
+    risks: list[dict[str, str]] = []
+    if "#part" not in jav_id and len(rclone) >= 3:
+        risks.append({
+            "code": "large_same_id_group",
+            "summary": f"{len(rclone)} files share this base ID; review for unrecognized parts before deleting.",
+        })
+
+    suspicious: list[str] = []
+    for e in rclone:
+        stem = Path(e.path).stem
+        base_match = PRIMARY_ID_RE.match(stem) or COMPOUND_ID_RE.match(stem) or FALLBACK_ID_RE.match(stem)
+        if not base_match:
+            continue
+        tail = _RESOLUTION_TAG_RE.sub("", stem[base_match.end():]).strip()
+        if _SUSPICIOUS_MULTIPART_TAIL_RE.search(tail):
+            suspicious.append(Path(e.path).name)
+    if suspicious and "#part" not in jav_id:
+        samples = ", ".join(suspicious[:3])
+        more = " ..." if len(suspicious) > 3 else ""
+        risks.append({
+            "code": "part_like_suffix",
+            "summary": f"Part-like suffixes still share the base ID: {samples}{more}",
+        })
+    return risks
+
+
+def find_variant_alerts(
+    entries: Iterable[FileEntry],
+) -> dict[str, list[FileEntry]]:
+    """Detect IDs where a bare form and a lowercase-variant form coexist.
+
+    Example: both ``IBW-902.mp4`` and ``IBW-902z.mp4`` are present.
+    They are different products — not dupes — but their coexistence is
+    suspicious and warrants manual comparison.
+
+    Returns {bare_id: [all entries whose re-evaluated ID matches bare or variant]}.
+    Only bare IDs that have at least one variant sibling are included.
+    """
+    index: dict[str, list[FileEntry]] = {}
+    for e in entries:
+        key = extract_id(Path(e.path).name) or e.jav_id
+        index.setdefault(key, []).append(e)
+
+    alerts: dict[str, list[FileEntry]] = {}
+    for jav_id in index:
+        if "#" in jav_id:
+            continue  # skip multipart IDs
+        m = _VARIANT_SUFFIX_RE.match(jav_id)
+        if not m:
+            continue
+        bare = m.group(1)
+        if bare in index:
+            # Merge bare + variant entries under the bare key.
+            if bare not in alerts:
+                alerts[bare] = list(index[bare])
+            alerts[bare].extend(index[jav_id])
+    return alerts
+
+
+# ---------- library issues (non-canonical filenames) ----------
+
+def _bracket_to_canonical(filename: str) -> str:
+    """[REAL-779].mp4 → REAL-779.mp4  |  [HODV-21076] Saki [1080p].mkv → HODV-21076 Saki [1080p].mkv"""
+    stem = Path(filename).stem
+    suffix = Path(filename).suffix
+    bm = _BRACKET_ID_RE.match(stem)
+    if not bm:
+        return filename
+    inner = bm.group(1).strip()
+    rest = stem[bm.end():].strip()
+    new_stem = f"{inner} {rest}".strip() if rest else inner
+    return f"{new_stem}{suffix}"
+
+
+def _nohyphen_to_canonical(filename: str) -> str:
+    """MVSD312 [576p].avi → MVSD-312 [576p].avi"""
+    stem = Path(filename).stem
+    suffix = Path(filename).suffix
+    m = _NOHYPHEN_ID_RE.match(stem)
+    if not m:
+        return filename
+    prefix = m.group(1).upper()
+    num_str = m.group(2)
+    rest = stem[m.end():]
+    return f"{prefix}-{num_str}{rest}{suffix}"
+
+
+def find_library_issues(cache: dict) -> dict:
+    """Scan cache for files with non-canonical names.
+
+    Returns:
+        {"bracket_names": [...], "nohyphen_names": [...]}
+    Each entry: {remote, path, size, mod_time, jav_id, canonical_name, issue}
+    """
+    bracket: list[dict] = []
+    nohyphen: list[dict] = []
+    for remote, remote_data in cache.get("remotes", {}).items():
+        for f in remote_data.get("files", []):
+            fname = Path(f["path"]).name
+            stem = Path(fname).stem
+            if stem.startswith("[") and _BRACKET_ID_RE.match(stem):
+                bracket.append({
+                    "remote": remote,
+                    "path": f["path"],
+                    "size": f.get("size", 0),
+                    "size_human": human_size(f.get("size", 0)),
+                    "mod_time": f.get("mod_time", ""),
+                    "jav_id": f.get("jav_id", ""),
+                    "canonical_name": _bracket_to_canonical(fname),
+                    "issue": "bracket_id",
+                })
+            elif (not PRIMARY_ID_RE.match(stem)
+                  and not COMPOUND_ID_RE.match(stem)
+                  and not FALLBACK_ID_RE.match(stem)
+                  and _NOHYPHEN_ID_RE.match(stem)):
+                nohyphen.append({
+                    "remote": remote,
+                    "path": f["path"],
+                    "size": f.get("size", 0),
+                    "size_human": human_size(f.get("size", 0)),
+                    "mod_time": f.get("mod_time", ""),
+                    "jav_id": f.get("jav_id", ""),
+                    "canonical_name": _nohyphen_to_canonical(fname),
+                    "issue": "nohyphen_id",
+                })
+    return {"bracket_names": bracket, "nohyphen_names": nohyphen}
+
+
+def rename_file_in_remote(
+    remote: str,
+    old_rel_path: str,
+    new_rel_path: str,
+    cache: dict,
+    rclone_bin: str = "rclone",
+    save: bool = True,
+) -> dict:
+    """Rename one file via rclone moveto and patch cache.json.
+
+    Returns {"ok": True, "old_path": ..., "new_path": ...}
+         or {"ok": False, "error": ..., "conflict": bool}
+
+    Pass save=False when batching — caller is responsible for calling save_cache() once.
+    """
+    sep = "" if remote.endswith("/") else "/"
+    old_full = f"{remote}{sep}{old_rel_path}"
+    new_full = f"{remote}{sep}{new_rel_path}"
+
+    # Collision check — does target already exist?
+    check = subprocess.run(
+        [rclone_bin, "lsf", new_full],
+        capture_output=True, text=True,
+    )
+    if check.returncode == 0 and check.stdout.strip():
+        return {"ok": False, "error": f"Target already exists: {new_full}", "conflict": True}
+
+    # Perform rename
+    result = subprocess.run(
+        [rclone_bin, "moveto", old_full, new_full],
+        capture_output=True, text=True,
+    )
+    if result.returncode != 0:
+        return {"ok": False, "error": (result.stderr or result.stdout).strip(), "conflict": False}
+
+    # Patch cache — update path + jav_id for the renamed entry
+    remote_data = cache.get("remotes", {}).get(remote)
+    if remote_data:
+        for f in remote_data.get("files", []):
+            if f["path"] == old_rel_path:
+                f["path"] = new_rel_path
+                f["jav_id"] = extract_id(Path(new_rel_path).name) or f["jav_id"]
+                break
+        remote_data["skipped"] = [s for s in remote_data.get("skipped", []) if s != old_rel_path]
+        if save:
+            save_cache(cache)
+
+    return {"ok": True, "old_path": old_full, "new_path": new_full}
+
+
+def rename_files_batch(
+    renames: list[dict],
+    cache: dict,
+    rclone_bin: str = "rclone",
+) -> list[dict]:
+    """Rename multiple files, writing cache once at the end.
+
+    Each item in renames: {remote, old_path, new_path}
+    Returns list of per-file results with old_path/new_path echoed back.
+    """
+    results = []
+    cache_dirty = False
+    for r in renames:
+        res = rename_file_in_remote(
+            r["remote"], r["old_path"], r["new_path"],
+            cache, rclone_bin=rclone_bin, save=False,
+        )
+        res["old_path"] = r["old_path"]
+        res["new_path"] = r["new_path"]
+        results.append(res)
+        if res["ok"]:
+            cache_dirty = True
+    if cache_dirty:
+        save_cache(cache)
+    return results
+
+
+# ---------- plain renderers (--basic) ----------
+
+def render_banner_plain(cache_meta: dict[str, dict], mode: str) -> str:
+    lines = [ansi(f"=== rc-jav ({mode}) ===", ANSI_BOLD)]
+    for r, m in cache_meta.items():
+        if m["cached"]:
+            tag = f"CACHED {m['age']}" + (" STALE" if m["stale"] else "")
+            tag_c = ansi(tag, ANSI_YELLOW if m["stale"] else ANSI_DIM)
+        else:
+            tag_c = ansi("FRESH SCAN", ANSI_GREEN)
+        count_str = ansi(f"({m['file_count']} files)", ANSI_DIM)
+        lines.append(f"  {r}  {tag_c}  {count_str}")
+    return "\n".join(lines)
+
+
+def render_search_plain(matches: dict[str, list[FileEntry]], queries: list[str],
+                        cache_meta: dict[str, dict]) -> str:
+    lines: list[str] = []
+    if cache_meta:
+        lines.append(render_banner_plain(cache_meta, "search"))
+        lines.append("")
+    for q in queries:
+        hits = matches.get(q, [])
+        if not hits:
+            lines.append(ansi(f"[{q}] NOT FOUND", ANSI_RED))
+            lines.append("")
+            continue
+        lines.append(ansi(f"[{q}] {len(hits)} hit(s)", ANSI_GREEN + ANSI_BOLD))
+        for e in sorted(hits, key=lambda x: (x.jav_id, x.path.lower())):
+            meta = cache_meta.get(e.remote, {})
+            if meta.get("cached"):
+                tag = ansi("[CACHED-STALE]", ANSI_YELLOW) if meta.get("stale") else ansi("[CACHED]", ANSI_DIM)
+            else:
+                tag = ansi("[FRESH]", ANSI_GREEN)
+            src = ansi(e.source, ANSI_YELLOW)
+            lines.append(f"  {src}  {tag}")
+            lines.append(ansi(f"    file: {Path(e.path).name}", ANSI_BOLD))
+            lines.append(f"    size: {human_size(e.size)} ({e.size:,} bytes)")
+            lines.append(ansi(f"    path: {e.full_path}", ANSI_DIM))
+        lines.append("")
+    return "\n".join(lines)
+
+
+# ---------- file outputs ----------
+
+def render_dupes_plain(dupes, skipped, variant_alerts=None) -> str:
+    lines: list[str] = []
+    if not dupes:
+        lines.append(ansi("No duplicates found.", ANSI_GREEN))
+    else:
+        lines.append(ansi(f"Found {len(dupes)} duplicate ID group(s):", ANSI_BOLD))
+        lines.append("")
+        total_reclaim = 0
+        for jav_id in sorted(dupes):
+            entries = dupes[jav_id]
+            keep = decide_keep(entries)
+            lines.append(ansi(f"[{jav_id}]", ANSI_BOLD))
+            for e in sorted(entries, key=lambda x: (x.source != "Source", x.source == "Catalog", -x.size)):
+                if e.source == "Catalog":
+                    mark = ansi("CATALOG ", ANSI_CYAN)
+                elif e is keep:
+                    mark = ansi("KEEP    ", ANSI_GREEN)
+                else:
+                    mark = ansi("DELETE? ", ANSI_RED)
+                    total_reclaim += e.size
+                src = ansi(f"{e.source:>8}", ANSI_YELLOW)
+                size_str = f"{human_size(e.size)} ({e.size:,} B)"
+                lines.append(f"  {mark} {src}  {size_str:>26}  {e.full_path}")
+            lines.append("")
+        lines.append(ansi(f"Potential space reclaim if all DELETE? removed: {human_size(total_reclaim)}", ANSI_BOLD))
+    if skipped:
+        lines.append("")
+        lines.append(ansi(f"Skipped {len(skipped)} file(s) with no parseable ID:", ANSI_DIM))
+        for remote, path in skipped[:50]:
+            lines.append(ansi(f"  {remote}  {path}", ANSI_DIM))
+        if len(skipped) > 50:
+            lines.append(ansi(f"  ... +{len(skipped) - 50} more", ANSI_DIM))
+    if variant_alerts:
+        lines.append("")
+        lines.append(ansi(f"⚠ {len(variant_alerts)} variant alert(s) — manual review required:", ANSI_YELLOW + ANSI_BOLD))
+        for bare_id, entries in sorted(variant_alerts.items()):
+            lines.append(ansi(f"  [{bare_id}] bare + variant coexist", ANSI_YELLOW))
+            for e in sorted(entries, key=lambda x: x.full_path):
+                eid = extract_id(Path(e.path).name) or e.jav_id
+                lines.append(f"    {ansi(eid, ANSI_YELLOW)}  {human_size(e.size):>10}  {e.full_path}")
+    return "\n".join(lines)
+
+
+def write_txt(path: Path, dupes, skipped):
+    path.write_text(render_dupes_plain(dupes, skipped), encoding="utf-8")
+
+
+def write_csv(path: Path, dupes):
+    with path.open("w", newline="", encoding="utf-8") as f:
+        w = csv.writer(f)
+        w.writerow(["jav_id", "action", "source", "remote", "path", "full_path",
+                    "size_bytes", "size_human", "mod_time"])
+        for jav_id in sorted(dupes):
+            entries = dupes[jav_id]
+            keep = decide_keep(entries)
+            for e in entries:
+                if e.source == "Catalog":
+                    action = "CATALOG"
+                elif e is keep:
+                    action = "KEEP"
+                else:
+                    action = "DELETE?"
+                w.writerow([jav_id, action, e.source,
+                            e.remote, e.path, e.full_path, e.size, human_size(e.size), e.mod_time])
+
+
+def describe_skipped_id(remote: str, path: str) -> dict[str, str]:
+    """Explain a common reason a path did not yield an ID."""
+    name = Path((path or "").replace("\\", "/")).name
+    reason = "No supported JAV ID at filename start"
+    hint = "Rename with a leading ID such as ABC-123 or add an ID normalizer/site-specific source."
+    if re.match(r"^\[[A-Za-z0-9-]+-\d+\]", name):
+        reason = "ID is wrapped in leading brackets"
+        hint = "Remove the leading brackets so the filename starts with the ID."
+    elif re.match(r"^[A-Za-z][A-Za-z0-9]+[\u2010-\u2015]\d+", name):
+        reason = "ID uses a non-ASCII dash"
+        hint = "Replace the separator with a normal hyphen."
+    elif re.match(r"^[A-Za-z][A-Za-z0-9]+\d+", name):
+        reason = "ID prefix and number have no hyphen"
+        hint = "Insert the ID hyphen, for example ABC-123."
+    return {"remote": remote, "path": path, "name": name, "reason": reason, "hint": hint}
+
+
+def dupes_to_obj(dupes, skipped, variant_alerts=None) -> dict:
+    out = {"groups": {}, "skipped": [describe_skipped_id(r, p) for r, p in skipped],
+           "variant_alerts": []}
+    for jav_id in sorted(dupes):
+        entries = dupes[jav_id]
+        keep, keep_reason = decide_keep_with_reason(entries)
+        out["groups"][jav_id] = {
+            "keep": asdict(keep) | {"full_path": keep.full_path, "size_human": human_size(keep.size)},
+            "keep_reason": keep_reason,
+            "risks": describe_dupe_risks(jav_id, entries),
+            "delete_candidates": [asdict(e) | {"full_path": e.full_path, "size_human": human_size(e.size)}
+                                  for e in entries
+                                  if e is not keep and e.source != "Catalog"],
+            "catalog": [asdict(e) | {"full_path": e.full_path, "size_human": human_size(e.size)}
+                        for e in entries if e.source == "Catalog"],
+        }
+    for bare_id, entries in sorted((variant_alerts or {}).items()):
+        out["variant_alerts"].append({
+            "bare_id": bare_id,
+            "files": [
+                asdict(e) | {"full_path": e.full_path, "size_human": human_size(e.size),
+                             "detected_id": extract_id(Path(e.path).name) or e.jav_id}
+                for e in sorted(entries, key=lambda x: x.full_path)
+            ],
+        })
+    return out
+
+
+def write_json(path: Path, dupes, skipped, variant_alerts=None):
+    path.write_text(json.dumps(dupes_to_obj(dupes, skipped, variant_alerts), indent=2), encoding="utf-8")
+
+
+# ---------- main ----------
+
+def main():
+    ap = argparse.ArgumentParser(description="Report duplicate JAV files across rclone remotes (read-only).")
+    ap.add_argument("--source", "-s", action="append", default=[], metavar="REMOTE",
+                    help="Source remote path (priority — wins dupes regardless of size). Repeatable.")
+    ap.add_argument("--target", "-t", action="append", default=[], metavar="REMOTE",
+                    help="Target remote path (non-priority — largest size wins among targets). Repeatable.")
+    ap.add_argument("--format", choices=["console", "txt", "csv", "json", "all"],
+                    default="console")
+    ap.add_argument("--output-dir", default="./reports", help="Where to write txt/csv/json.")
+    ap.add_argument("--no-color", action="store_true")
+    ap.add_argument("--rclone-bin", default="rclone",
+                    help="Path to rclone executable (default: 'rclone' on PATH).")
+    ap.add_argument("--search", action="append", default=[], metavar="ID",
+                    help="Search mode: look up a JAV ID (e.g. SSIS-001). Repeatable. "
+                         "If no --source/--target given, default target is used.")
+    ap.add_argument("--name", action="append", default=[], metavar="STR",
+                    help="Substring/glob search against filename. Case-insensitive. "
+                         "Repeatable; OR semantics (any token match = hit). "
+                         "Supports * and ? wildcards. Use quotes for spaces.")
+    ap.add_argument("--update", "-u", action="store_true",
+                    help="Search mode: force re-scan and overwrite cache for requested remotes.")
+    ap.add_argument("--no-cache", action="store_true",
+                    help="Search mode: bypass cache entirely (no read, no write).")
+    ap.add_argument("--quick", "-q", action="store_true",
+                    help="Force quick mode: skip cache, query rclone directly with --include glob. "
+                         "Default is auto: single exact IDs use quick, wildcards/ranges/multi use cached.")
+    ap.add_argument("--cache", action="store_true",
+                    help="Force cached mode (opposite of --quick).")
+    ap.add_argument("--save", action="store_true",
+                    help="Persist the --source / --target / --catalog values you passed "
+                         "as new defaults in config.json next to the script. "
+                         "Only keys you explicitly passed are saved.")
+    ap.add_argument("--scan", action="store_true",
+                    help="Walk configured remotes, refresh cache, exit. No search/dupe output. "
+                         "Default scope: DEFAULT_TARGET. Override with --source/--target. "
+                         "Always overwrites cache. Suitable for Task Scheduler / cron.")
+    ap.add_argument("--scan-since", metavar="DURATION",
+                    help="Incremental scan: only walk files modified within DURATION "
+                         "(e.g. 24h, 7d, 30m, 90s). Merges new/changed entries on top of "
+                         "the existing cache; old entries are preserved. Falls back to a "
+                         "full scan if there's no prior cache for a remote. Requires --scan.")
+    ap.add_argument("--catalog", action="append", default=[], metavar="PATH",
+                    help="Path to a WinCatalog CSV or XML export. Repeatable. "
+                         "Listed under 'Catalog' in results (informational, never KEEP/DELETE?).")
+    ap.add_argument("--part-pattern", action="append", default=[], metavar="REGEX",
+                    help="Extra multipart filename regex. Repeatable; first capture group must be the part number. "
+                         "Patterns run against the filename stem after built-in part detectors.")
+    ap.add_argument("--library-issues", action="store_true",
+                    help="Report non-canonical filenames (bracket-wrapped IDs, no-hyphen IDs). "
+                         "Reads from cache. Outputs JSON when --format json, plain otherwise.")
+    ap.add_argument("--rename-file", action="store_true",
+                    help="Rename one file in a remote and patch cache. "
+                         "Requires --remote, --old-path, --new-path. Outputs JSON.")
+    ap.add_argument("--rename-files-batch", action="store_true",
+                    help="Rename multiple files in one call, writing cache once. "
+                         "Reads JSON array of {remote, old_path, new_path} from stdin. Outputs JSON.")
+    ap.add_argument("--remote", metavar="REMOTE",
+                    help="Remote path root for --rename-file (e.g. cq:JAV).")
+    ap.add_argument("--old-path", metavar="PATH",
+                    help="Relative path of the file to rename (within --remote).")
+    ap.add_argument("--new-path", metavar="PATH",
+                    help="New relative path after rename (within --remote).")
+    ap.add_argument("--basic", action="store_true",
+                    help="Plain text output, no rich tables/panels/progress bars. "
+                         "Useful for piping or low-bandwidth terminals.")
+    ap.add_argument("--clearjav", action="store_true",
+                    help="Shortcut: use DEFAULT_SOURCE as --source and DEFAULT_TARGET as --target, "
+                         "Equivalent to "
+                         "`--source cq:personal-files/ClearJAV --target cq:personal-files/JAV/TMP`.")
+    args = ap.parse_args()
+
+    global RCLONE_BIN, console, BASIC, DEFAULT_SOURCE, DEFAULT_TARGET, DEFAULT_CATALOG
+    RCLONE_BIN = args.rclone_bin
+    BASIC = args.basic or args.format == "json"
+
+    # Apply persisted config overrides BEFORE defaults are consulted.
+    cfg = load_config()
+    if "default_source" in cfg:
+        DEFAULT_SOURCE = list(cfg["default_source"])
+    if "default_target" in cfg:
+        DEFAULT_TARGET = list(cfg["default_target"])
+    if "default_catalog" in cfg:
+        DEFAULT_CATALOG = list(cfg["default_catalog"])
+    global _KEEP_RANKING
+    _KEEP_RANKING = cfg.get("keep_ranking") or {}
+    part_patterns = list(cfg.get("part_patterns") or []) + list(args.part_pattern)
+    pattern_errors = configure_part_patterns(part_patterns)
+    if pattern_errors:
+        for err in pattern_errors:
+            console.print(f"[red]invalid part pattern:[/] {err}")
+        sys.exit(2)
+
+    # --save: persist explicitly-passed values, exit.
+    if args.save:
+        if not (args.source or args.target or args.catalog or args.part_pattern):
+            console.print("[red]--save needs at least one --source/--target/--catalog/--part-pattern value to persist.[/]")
+            sys.exit(2)
+        new_cfg = dict(cfg)
+        if args.source:
+            new_cfg["default_source"] = list(args.source)
+        if args.target:
+            new_cfg["default_target"] = list(args.target)
+        if args.catalog:
+            new_cfg["default_catalog"] = list(args.catalog)
+        if args.part_pattern:
+            new_cfg["part_patterns"] = list(args.part_pattern)
+        save_config(new_cfg)
+        console.print(f"[green]Saved to {CONFIG_PATH}:[/]")
+        for k in ("default_source", "default_target", "default_catalog", "part_patterns"):
+            if k in new_cfg:
+                console.print(f"  {k} = {new_cfg[k]}")
+        sys.exit(0)
+    global USE_ANSI
+    USE_ANSI = not args.no_color
+    if args.no_color or BASIC:
+        console = Console(no_color=True, color_system=None, highlight=False)
+
+    # Search mode: defaults kick in if no remotes specified.
+    if args.clearjav:
+        if not args.source:
+            args.source = list(DEFAULT_SOURCE)
+        if not args.target:
+            args.target = list(DEFAULT_TARGET)
+
+    if args.search and not args.source and not args.target:
+        args.target = list(DEFAULT_TARGET)
+
+    # --scan: default to DEFAULT_TARGET only, always overwrite cache.
+    if args.scan:
+        if not args.source and not args.target:
+            args.target = list(DEFAULT_TARGET)
+        args.update = True
+
+    # Use default catalog(s) if user passed none.
+    if not args.catalog and DEFAULT_CATALOG:
+        args.catalog = list(DEFAULT_CATALOG)
+
+    # --library-issues: read-only cache scan for non-canonical filenames.
+    if args.library_issues:
+        cache = load_cache()
+        issues = find_library_issues(cache)
+        if args.format == "json" or BASIC:
+            print(json.dumps({"ok": True, **issues}))
+        else:
+            bracket = issues["bracket_names"]
+            nohyphen = issues["nohyphen_names"]
+            total = len(bracket) + len(nohyphen)
+            if not total:
+                console.print(Panel("[bold green]No library issues found.[/]", title="Library Issues"))
+            else:
+                from rich.table import Table
+                t = Table(title=f"Library Issues ({total} file(s))", show_lines=True)
+                t.add_column("Issue", style="yellow", width=14)
+                t.add_column("Current Name")
+                t.add_column("Canonical Name", style="green")
+                t.add_column("Remote", style="dim")
+                for e in bracket:
+                    t.add_row("bracket ID", Path(e["path"]).name,
+                              e["canonical_name"], e["remote"])
+                for e in nohyphen:
+                    t.add_row("no hyphen", Path(e["path"]).name,
+                              e["canonical_name"], e["remote"])
+                console.print(t)
+        sys.exit(0)
+
+    # --rename-files-batch: rename multiple files, single cache write.
+    if args.rename_files_batch:
+        try:
+            renames = json.loads(sys.stdin.read())
+        except json.JSONDecodeError as e:
+            print(json.dumps({"ok": False, "error": f"Invalid JSON on stdin: {e}"}))
+            sys.exit(1)
+        if not isinstance(renames, list):
+            print(json.dumps({"ok": False, "error": "stdin must be a JSON array"}))
+            sys.exit(1)
+        cache = load_cache()
+        results = rename_files_batch(renames, cache, rclone_bin=RCLONE_BIN)
+        ok = any(r["ok"] for r in results)
+        print(json.dumps({"ok": ok, "results": results}))
+        sys.exit(0 if ok else 1)
+
+    # --rename-file: rename one file in a remote and patch cache.
+    if args.rename_file:
+        if not args.remote or not args.old_path or not args.new_path:
+            ap.error("--rename-file requires --remote, --old-path, and --new-path.")
+        cache = load_cache()
+        result = rename_file_in_remote(
+            args.remote, args.old_path, args.new_path, cache, rclone_bin=RCLONE_BIN
+        )
+        print(json.dumps(result))
+        sys.exit(0 if result["ok"] else 1)
+
+    if not args.source and not args.target and not args.catalog:
+        ap.error("Provide at least one --source, --target, or --catalog.")
+
+    # Scan-only mode: walk remotes, write cache, summary, exit.
+    if args.scan:
+        scan_since = None
+        if args.scan_since:
+            scan_since = parse_duration(args.scan_since)
+            if not scan_since:
+                console.print(f"[red]invalid --scan-since value: {args.scan_since!r} "
+                              f"(expected e.g. 24h, 7d, 30m, 90s)[/]")
+                sys.exit(2)
+        cache = load_cache()
+        cache_meta: dict[str, dict] = {}
+        skipped: list[tuple[str, str]] = []
+        t0 = time.perf_counter()
+        if BASIC:
+            # `--scan` resolves its default target above. Report only the
+            # remotes that this scan will actually walk; falling back here to
+            # DEFAULT_SOURCE would resurrect retired source roots in job UI.
+            _all_remotes = list(args.source) + list(args.target)
+            sys.stderr.write("SCAN_START " + json.dumps({
+                "remotes": _all_remotes, "total": len(_all_remotes),
+            }) + "\n")
+            sys.stderr.flush()
+        entries = (cached_collect(args.source, "Source", skipped, cache,
+                                  use_cache=not args.no_cache, force_update=True,
+                                  cache_meta=cache_meta, scan_since=scan_since)
+                   + cached_collect(args.target, "Target", skipped, cache,
+                                    use_cache=not args.no_cache, force_update=True,
+                                    cache_meta=cache_meta, scan_since=scan_since))
+        if not args.no_cache:
+            save_cache(cache)
+        elapsed = time.perf_counter() - t0
+        if BASIC:
+            sys.stderr.write(f"Scan complete: {len(entries)} files in {elapsed:.2f}s\n")
+            sys.stderr.write(f"Cache: {CACHE_PATH}\n" if not args.no_cache
+                             else "Cache: (skipped, --no-cache)\n")
+        else:
+            console.print(f"[bold green]Scan complete:[/] {len(entries)} files in {elapsed:.2f}s")
+            if not args.no_cache:
+                console.print(f"[dim]Cache: {CACHE_PATH}[/]")
+            else:
+                console.print("[dim]Cache: (skipped, --no-cache)[/]")
+        sys.exit(0)
+
+    skipped: list[tuple[str, str]] = []
+    t0 = time.perf_counter()
+
+    if args.search or args.name:
+        search_timings: dict[str, int] = {}
+        # If --name was passed without explicit remotes, fall back to default target
+        # (catalog default already injected earlier; don't let it suppress remote defaulting).
+        if args.name and not args.search and not args.source and not args.target:
+            args.target = list(DEFAULT_TARGET)
+        # Substring name search can't be server-side filtered on most backends — cache wins.
+        # Only the ID search shape benefits from quick (server-side prefix glob).
+        if args.name and not args.quick:
+            mode, reason = "cached", "name substring search — cache is faster than rclone --include"
+        else:
+            combined = list(args.search) + list(args.name)
+            mode, reason = choose_search_mode(combined, args.quick, args.cache)
+        if BASIC:
+            sys.stderr.write(f"Mode: {mode}  ({reason})\n")
+        else:
+            mode_color = "green" if mode == "quick" else "cyan"
+            console.print(f"[{mode_color}]Mode: {mode}[/]  [dim]({reason})[/]")
+
+        phase_t0 = time.perf_counter()
+        cache = load_cache()
+        search_timings["cache_load_ms"] = round((time.perf_counter() - phase_t0) * 1000)
+        use_cache = not args.no_cache and mode == "cached"
+        cache_meta: dict[str, dict] = {}
+        phase_t0 = time.perf_counter()
+        if mode == "quick":
+            all_patterns: list[str] = []
+            for raw in args.search:
+                all_patterns.extend(query_to_include_patterns(raw))
+            all_patterns.extend(name_to_include_patterns(args.name))
+            entries = []
+            for r in args.source:
+                cache_meta[r] = {"cached": False, "age": "quick", "stale": False, "file_count": 0}
+                got = quick_search_remote(r, "Source", all_patterns, skipped)
+                entries.extend(got)
+                cache_meta[r]["file_count"] = len(got)
+            for r in args.target:
+                cache_meta[r] = {"cached": False, "age": "quick", "stale": False, "file_count": 0}
+                got = quick_search_remote(r, "Target", all_patterns, skipped)
+                entries.extend(got)
+                cache_meta[r]["file_count"] = len(got)
+        else:
+            entries = (cached_collect(args.source, "Source", skipped, cache,
+                                      use_cache, args.update, cache_meta)
+                       + cached_collect(args.target, "Target", skipped, cache,
+                                        use_cache, args.update, cache_meta))
+        search_timings["entry_collect_ms"] = round((time.perf_counter() - phase_t0) * 1000)
+        # Load each catalog separately so cache_meta gets the per-catalog count
+        # (was global total — every catalog reported the sum across all).
+        catalog_entries: list[FileEntry] = []
+        phase_t0 = time.perf_counter()
+        for cp_str in args.catalog:
+            for cp in _expand_catalog_paths([cp_str]):
+                ext = cp.suffix.lower()
+                if ext == ".csv":
+                    one = load_catalog_csv(cp, skipped)
+                elif ext == ".xml":
+                    one = load_catalog_xml(cp, skipped)
+                else:
+                    console.print(f"[yellow]WARN: unknown catalog format '{ext}' for {cp}; skipping.[/]")
+                    continue
+                catalog_entries.extend(one)
+                cache_meta[f"catalog:{cp.name}"] = {
+                    "cached": False, "age": "loaded", "stale": False,
+                    "file_count": len(one),
+                }
+        entries.extend(catalog_entries)
+        search_timings["catalog_load_ms"] = round((time.perf_counter() - phase_t0) * 1000)
+        if use_cache and args.update:
+            save_cache(cache)
+    else:
+        if args.cache and not args.no_cache:
+            cache = load_cache()
+            cache_meta: dict[str, dict] = {}
+            entries = (cached_collect(args.source, "Source", skipped, cache,
+                                      use_cache=True, force_update=False,
+                                      cache_meta=cache_meta)
+                       + cached_collect(args.target, "Target", skipped, cache,
+                                        use_cache=True, force_update=False,
+                                        cache_meta=cache_meta))
+        else:
+            remotes_by_label = ([("Source", r) for r in args.source]
+                                + [("Target", r) for r in args.target])
+            entries = collect_with_progress(remotes_by_label, skipped)
+        entries.extend(load_catalogs(args.catalog, skipped))
+
+    elapsed = time.perf_counter() - t0
+    if BASIC:
+        sys.stderr.write(f"Scanned/loaded {len(entries)} file(s) in {elapsed:.2f}s\n")
+    else:
+        console.print(f"[dim]Scanned/loaded {len(entries)} file(s) in {elapsed:.2f}s[/]")
+
+    if args.search or args.name:
+        # query_expansions: original_raw -> list of normalized IDs / wildcard patterns to look up
+        query_expansions: dict[str, list[str]] = {}
+        queries: list[str] = []
+        for raw in args.search:
+            if RANGE_RE.search(raw):
+                expanded = expand_range(raw) or []
+                normed: list[str] = []
+                for r in expanded:
+                    n = normalize_id(r)
+                    if n:
+                        normed.append(n)
+                if not normed:
+                    console.print(f"[yellow]WARN: range '{raw}' produced no valid IDs.[/]")
+                    continue
+                queries.append(raw)
+                query_expansions[raw] = normed
+                continue
+            if "*" in raw or "?" in raw:
+                q = raw.upper()
+                queries.append(q)
+                query_expansions[q] = [q]
+                continue
+            norm = normalize_id(raw)
+            if not norm:
+                console.print(f"[yellow]WARN: cannot parse '{raw}' as a JAV ID, skipping.[/]")
+                continue
+            # Use the raw (upper-cased) form for display so leading zeros are preserved
+            # (e.g. user types PRTD-027 — keep it, don't show PRTD-27). Lookup still uses
+            # the normalized form internally.
+            display = raw.upper()
+            queries.append(display)
+            query_expansions[display] = [norm]
+        phase_t0 = time.perf_counter()
+        index: dict[str, list[FileEntry]] = {}
+        for e in entries:
+            index.setdefault(e.jav_id, []).append(e)
+        search_timings["index_ms"] = round((time.perf_counter() - phase_t0) * 1000)
+        phase_t0 = time.perf_counter()
+        matches: dict[str, list[FileEntry]] = {}
+        match_traces: dict[str, dict[int, dict[str, str]]] = {}
+        for q in queries:
+            expansions = query_expansions.get(q, [q])
+            hits: list[FileEntry] = []
+            seen: set[int] = set()
+            traces: dict[int, dict[str, str]] = {}
+
+            def add_hit(entry: FileEntry, matched_query: str) -> None:
+                key = id(entry)
+                if key in seen:
+                    return
+                seen.add(key)
+                hits.append(entry)
+                traces[key] = describe_id_match(q, matched_query, entry.jav_id, len(expansions))
+
+            for sub in expansions:
+                if "*" in sub or "?" in sub:
+                    pat = sub if "#PART" in sub.upper() else sub + "*"
+                    for k, v in index.items():
+                        if fnmatch.fnmatchcase(k, pat):
+                            for e in v:
+                                add_hit(e, sub)
+                elif "#part" in sub:
+                    for e in index.get(sub, []):
+                        add_hit(e, sub)
+                else:
+                    for e in index.get(sub, []):
+                        add_hit(e, sub)
+                    for k, v in index.items():
+                        if k.startswith(sub + "#part"):
+                            for e in v:
+                                add_hit(e, sub)
+            matches[q] = hits
+            match_traces[q] = traces
+        search_timings["match_ms"] = round((time.perf_counter() - phase_t0) * 1000)
+        if args.format == "json":
+            # Structured output for tools that consume search results (e.g. the rclonex
+            # Brave extension). Includes everything needed to drive a UI: per-query hits
+            # with source/remote/path/size/mod_time, plus name-match block + skipped.
+            name_hits_json: list[FileEntry] = []
+            if args.name:
+                for e in entries:
+                    if name_match(Path(e.path).stem, args.name):
+                        name_hits_json.append(e)
+            out_obj = {
+                "queries": [
+                    {
+                        "query": q,
+                        "hits": [
+                            {"source": e.source, "remote": e.remote, "path": e.path,
+                             "full_path": e.full_path, "size": e.size,
+                             "size_human": human_size(e.size),
+                             "mod_time": e.mod_time, "jav_id": e.jav_id,
+                             **match_traces.get(q, {}).get(id(e), {})}
+                            for e in sorted(matches.get(q, []), key=lambda x: (x.jav_id, x.path.lower()))
+                        ],
+                    }
+                    for q in queries
+                ],
+                "name_matches": [
+                    {"source": e.source, "remote": e.remote, "path": e.path,
+                     "full_path": e.full_path, "size": e.size,
+                     "size_human": human_size(e.size), "mod_time": e.mod_time,
+                     "jav_id": e.jav_id, "match_kind": "name",
+                     "match_reason": "Filename search", "match_confidence": "broad",
+                     "matched_query": ", ".join(args.name), "matched_id": e.jav_id}
+                    for e in sorted(name_hits_json, key=lambda x: (x.jav_id, x.path.lower()))
+                ],
+                "name_tokens": list(args.name),
+                "cache_meta": cache_meta,
+                "skipped_count": len(skipped),
+                "elapsed_sec": round(time.perf_counter() - t0, 3),
+                "timings": search_timings,
+            }
+            print(json.dumps(out_obj))
+            id_ok = (not queries) or all(matches.values())
+            name_ok = (not args.name) or bool(name_hits_json)
+            sys.exit(0 if (id_ok and name_ok) else 1)
+        if queries:
+            if BASIC:
+                print(render_search_plain(matches, queries, cache_meta))
+            else:
+                render_search(matches, queries, cache_meta)
+        # --name results as a separate block
+        name_hits: list[FileEntry] = []
+        if args.name:
+            for e in entries:
+                if name_match(Path(e.path).stem, args.name):
+                    name_hits.append(e)
+            if BASIC:
+                print(render_name_matches_plain(name_hits, args.name, cache_meta))
+            else:
+                render_name_matches(name_hits, args.name, cache_meta)
+        # Exit code: 0 if every search query had hits AND name-search (if used) returned hits.
+        id_ok = (not queries) or all(matches.values())
+        name_ok = (not args.name) or bool(name_hits)
+        sys.exit(0 if (id_ok and name_ok) else 1)
+
+    dupes = find_dupes(entries)
+    variant_alerts = find_variant_alerts(entries)
+    if args.format == "json" and BASIC:
+        print(json.dumps(dupes_to_obj(dupes, skipped, variant_alerts)))
+        sys.exit(0)
+    if BASIC:
+        print(render_dupes_plain(dupes, skipped, variant_alerts))
+    else:
+        render_dupes(dupes, skipped, variant_alerts)
+
+    if args.format != "console":
+        out_dir = Path(args.output_dir)
+        out_dir.mkdir(parents=True, exist_ok=True)
+        stamp = datetime.now().strftime("%Y%m%d-%H%M%S")
+        targets = {"txt", "csv", "json"} if args.format == "all" else {args.format}
+        if "txt" in targets:
+            write_txt(out_dir / f"dupes-{stamp}.txt", dupes, skipped)
+        if "csv" in targets:
+            write_csv(out_dir / f"dupes-{stamp}.csv", dupes)
+        if "json" in targets:
+            write_json(out_dir / f"dupes-{stamp}.json", dupes, skipped, variant_alerts)
+        console.print(f"[dim]Reports written to {out_dir}[/]")
+
+
+if __name__ == "__main__":
+    try:
+        main()
+    except KeyboardInterrupt:
+        console.print("\n[yellow]Aborted by user (Ctrl+C). Cache not written for in-flight scans.[/]")
+        sys.exit(130)
diff --git a/tests/test_rules.py b/tests/test_rules.py
new file mode 100644
index 0000000..5e4c147
--- /dev/null
+++ b/tests/test_rules.py
@@ -0,0 +1,74 @@
+import importlib.util
+import sys
+import unittest
+from pathlib import Path
+
+
+ROOT = Path(__file__).resolve().parents[1]
+SPEC = importlib.util.spec_from_file_location("rcjav_rules", ROOT / "rc-jav.py")
+RCJAV = importlib.util.module_from_spec(SPEC)
+sys.modules[SPEC.name] = RCJAV
+SPEC.loader.exec_module(RCJAV)
+
+
+def entry(path, size=1_000, jav_id="TEST-001"):
+    return RCJAV.FileEntry(
+        source="Target",
+        remote="cq:JAV",
+        path=path,
+        size=size,
+        mod_time="",
+        jav_id=jav_id,
+    )
+
+
+class IdRuleTests(unittest.TestCase):
+    def test_builtin_multipart_shapes_keep_parts_distinct(self):
+        expected = {
+            "KV-118 - Aiba Reika_PART1.mp4": "KV-118#part1",
+            "KV-118_A.mp4": "KV-118#part1",
+            "OFJE-195-7 [480p].mp4": "OFJE-195#part7",
+            "ABC-027.mp4": "ABC-027",
+        }
+        for name, jav_id in expected.items():
+            with self.subTest(name=name):
+                self.assertEqual(RCJAV.extract_id(name), jav_id)
+
+    def test_multipart_files_do_not_form_base_duplicate_group(self):
+        files = [
+            entry("KV-118 - Aiba Reika_PART1.mp4", jav_id="KV-118"),
+            entry("KV-118 - Aiba Reika_PART2.mp4", jav_id="KV-118"),
+            entry("KV-118 - Aiba Reika_PART3.mp4", jav_id="KV-118"),
+        ]
+        self.assertEqual(RCJAV.find_dupes(files), {})
+
+    def test_large_same_id_group_gets_manual_review_risk(self):
+        files = [
+            entry("TEST-001 direct.mp4"),
+            entry("TEST-001 edit.mp4"),
+            entry("TEST-001 mirror.mp4"),
+        ]
+        risks = RCJAV.describe_dupe_risks("TEST-001", files)
+        self.assertIn("large_same_id_group", {risk["code"] for risk in risks})
+
+
+class KeepRankingTests(unittest.TestCase):
+    def test_vip_folder_beats_larger_non_vip_copy(self):
+        keep, reason = RCJAV.decide_keep_with_reason([
+            entry("ClearJAV/TEST-001.mp4", size=2_000),
+            entry("Other/TEST-001 [1080p].mkv", size=9_000),
+        ])
+        self.assertEqual(keep.path, "ClearJAV/TEST-001.mp4")
+        self.assertEqual(reason["code"], "vip_folder")
+
+    def test_ts_loses_to_non_ts_even_when_larger(self):
+        keep, reason = RCJAV.decide_keep_with_reason([
+            entry("Other/TEST-001.ts", size=9_000),
+            entry("Other/TEST-001.mp4", size=8_000),
+        ])
+        self.assertEqual(keep.path, "Other/TEST-001.mp4")
+        self.assertEqual(reason["code"], "container")
+
+
+if __name__ == "__main__":
+    unittest.main()