diff --git a/.gitignore b/.gitignore
index 6cf9326..4d495c9 100644
--- a/.gitignore
+++ b/.gitignore
@@ -5,6 +5,10 @@
 
 # Testing artefacts
 .temp-profile
+tests/.env
+tests/.env.local
+__pycache__/
+*.pyc
 
 # logs
 geckodriver.log
diff --git a/js/lib.js b/js/lib.js
index e38430e..518a6fa 100644
--- a/js/lib.js
+++ b/js/lib.js
@@ -57,6 +57,16 @@ class MissingMappedField {
     toString() {
         return `${this.value}`;
     }
+
+    // Mirror 4CAT's API serialization so JSON.stringify produces the same
+    // tagged form on both sides: 4CAT's /api/dataset/<key>/items/ endpoint,
+    // when called with `missing_fields=keep`, emits missing values as
+    // `{ __missing: true, value: <fallback> }`. Matching that shape here
+    // lets the map_item comparator deep-equal both sides without special
+    // handling.
+    toJSON() {
+        return { __missing: true, value: this.value };
+    }
 }
 
 /**
diff --git a/modules/_loader.js b/modules/_loader.js
index afae2d7..ceb0080 100644
--- a/modules/_loader.js
+++ b/modules/_loader.js
@@ -1,3 +1,8 @@
+// Load-order dependency: `wrap_for_map_item` (used below) is a free global
+// defined in js/lib.js, which manifest.json loads as a plain background
+// script before this module. There is no import for it here on purpose —
+// MV2 background scripts share one global scope. If lib.js stops being
+// loaded first, the mapper wrapper below will ReferenceError.
 async function load() {
     const imported_modules = [
         await import("./tiktok.js"),
diff --git a/modules/package.json b/modules/package.json
new file mode 100644
index 0000000..3dbc1ca
--- /dev/null
+++ b/modules/package.json
@@ -0,0 +1,3 @@
+{
+  "type": "module"
+}
diff --git a/tests/.env.example b/tests/.env.example
new file mode 100644
index 0000000..137a52b
--- /dev/null
+++ b/tests/.env.example
@@ -0,0 +1,23 @@
+# 4CAT API config for the map_item comparator (`npm run test:compare`).
+# Copy this file to .env in this directory and fill in real values.
+# .env is gitignored; .env.example is the committed template.
+
+# Base URL of the 4CAT instance to hit. No trailing slash. Default ports:
+#   :80   for nginx (production)
+#   :4000 for the Flask dev server
+FOURCAT_URL=http://localhost
+
+# API key for that 4CAT instance. Get one from the 4CAT UI; tied to your
+# user. 4CAT accepts the raw key as the Authorization header value (no
+# `Bearer ` prefix).
+FOURCAT_API_KEY=your-api-key-here
+
+# Comma-separated list of dataset keys (the 32-char ids from 4CAT dataset
+# URLs) to compare. The comparator pulls inputs from /download/<key> and
+# expected outputs from
+# /api/dataset/<key>/items/?annotations=no&missing_fields=keep&stream=true
+# for each. Datasource is read from the items endpoint's response headers.
+#
+# `npm run test:compare -- <key>` narrows a single run to one key; the key
+# must still be listed here.
+FOURCAT_DATASETS=key1,key2,key3
diff --git a/tests/README.md b/tests/README.md
index f1188e2..f203b60 100644
--- a/tests/README.md
+++ b/tests/README.md
@@ -1,31 +1,42 @@
 ## Tests for Zeeschuimer
 
-This folder contains **testing** code for Zeeschuimer.
+This folder contains testing code for Zeeschuimer. There are four suites,
+each with a different purpose and a different runtime environment:
 
-### Integration Tests (Selenium)
+| Suite                            | Tests                                                     | Environment        | When it runs                    | Needs                                  |
+|----------------------------------|-----------------------------------------------------------|--------------------|---------------------------------|----------------------------------------|
+| Selenium integration             | Page captures real items from each supported platform     | Real Firefox       | Reviewer-supervised, manual     | Firefox profile, sometimes a human     |
+| Duplicate-behavior unit (Jest)   | DB merge / keep / update semantics in isolation           | jsdom + fake-IDB   | `npm test` (every push)         | None                                   |
+| Module load smoke (Jest, Tier 1) | Each `modules/*.js` parses and imports cleanly            | jsdom              | `npm test` (every push)         | None                                   |
+| `map_item` comparator (Jest, Tier 2) | JS `map_item` output matches 4CAT's Python mapping per item | jsdom + cross-fetch | `npm run test:compare` (on demand) | Live 4CAT, API key, dataset key(s) |
 
-The Python + Selenium tests visit pages on supported platforms
-and see how many items are captured. If the amount of items captured is 
-unexpectedly low or high, this is flagged and may indicate that Zeeschuimer no
-longer properly captures data from the platform.
+Hermetic suites (no external dependencies) live in `npm test`. Anything that
+requires a real browser, a 4CAT server, or a human in the loop is opt-in.
 
-These tests are **supervised** i.e. they require monitoring by a human and 
+### Integration tests (Selenium)
+
+The Python + Selenium tests visit pages on supported platforms and see how
+many items are captured. If the amount of items captured is unexpectedly
+low or high, this is flagged and may indicate that Zeeschuimer no longer
+properly captures data from the platform.
+
+These tests are **supervised** — they require monitoring by a human and
 cannot run fully autonomously, since some platforms (TikTok in particular)
 occasionally show CAPTCHAs that need to be completed for a test to run
 successfully. This is also why Selenium does not run a headless Firefox.
 
-The amount of items returned per page is somewhat variable for most platforms,
-so if the number is slightly lower or higher than expected this is not 
-necessarily a problem (but worth checking).
+The amount of items returned per page is somewhat variable for most
+platforms, so if the number is slightly lower or higher than expected this
+is not necessarily a problem (but worth checking).
 
-Additionally, most platforms require logging in before (full) access to the UI
-is available. The testing script borrows a Firefox profile directory from 
-elsewhere on the system to do this. It will try to find one automatically but
-you can also pass one with the `--profiledir` argument. The idea is that you
-log in to the various sites (Instagram, etc) in your 'normal' Firefox, and the
-tests then borrow that login to interface with the website.
+Most platforms require logging in before (full) access to the UI is
+available. The testing script borrows a Firefox profile directory from
+elsewhere on the system to do this. It will try to find one automatically
+but you can also pass one with the `--profiledir` argument. Log in to the
+various sites (Instagram, etc) in your 'normal' Firefox, and the tests then
+borrow that login.
 
-Run `test.py` to run tests. Required non-standard libraries are in 
+Run `test.py` to run tests. Required non-standard libraries are in
 `requirements.txt`.
 
 Tests are defined in `tests.json` with the following structure:
@@ -35,49 +46,152 @@ Tests are defined in `tests.json` with the following structure:
   "platform id as in zeeschuimer (e.g. 'tiktok.com')": {
     "test case (e.g. 'Home feed')": {
       "url": {
-        "expected": 0,  # amount of items expected to be captured on this page
-        "more-after-scroll": false,  # whether scrolling is supposed to load more items (currently unsupported)
-        "wait": 10  # wait time before checking number of items (optional, default 5)
-      } # more URLS can be added per test case
+        "expected": 0,
+        "more-after-scroll": false,
+        "wait": 10
+      }
     }
   }
 }
 ```
 
-### Unit Tests (Jest)
-
-The JavaScript unit tests verify duplicate-handling logic in isolation using 
-a mocked Dexie database. These tests ensure that when the duplicate behavior 
-setting is changed, the correct existing record is selected for updates.
+### Jest suites
 
 **Prerequisites**
-- Node.js (v18 or later) and npm must be installed
+- Node.js (v18 or later) and npm
+- `cd tests && npm install`
+
+**Recommended: develop the tests inside Docker.** On Windows the global
+permission model can make `npm install` / `npm test` awkward to run from
+an arbitrary shell, and an agentic assistant working in auto-mode will
+hit deny-rules before it can do a `cross-fetch`-style dependency spike.
+Any minimal `node:20`-or-newer image with this repo mounted in is
+enough — install what you need, run `npm install`, run `npm test` and
+`npm run test:compare`. The host's `tests/.env` is picked up via the
+mount, and `FOURCAT_URL` can point at a 4CAT reachable from the
+container (`host.docker.internal` on Windows/Mac, the host IP on
+Linux).
+
+#### Duplicate-behavior unit tests
+
+Verify duplicate-handling logic in isolation using a mocked Dexie database.
+Ensures that when the duplicate behavior setting is changed, the correct
+existing record is selected for updates.
+
+Coverage:
+- Schema upgrade backfills `last_updated` from `timestamp_collected`
+- Compound index correctly selects most recent item by `last_updated`
+- Forward-looking behavior: "keep" → "update" targets newest record
+- Forward-looking behavior: "update" → "keep" creates new records
+- Merge: shallow merge preserves fields from both records
+- Skip: no modifications occur when duplicate found
+- Platform isolation: same `item_id` on different platforms are independent
+- Tie-breaker: when `last_updated` is equal, prefer higher `id`
+
+#### Module load smoke (Tier 1)
+
+For every `modules/*.js` file not prefixed with `_`, `tests/map_item.test.js`
+asserts the module parses and imports without throwing. Modules with a `map_item`
+export and modules without one both pass this tier — the goal is purely to
+catch a generator that emits a syntax error or an import-time throw.
+
+No data is run through `map_item` here; that work belongs in the
+comparator.
+
+#### `map_item` comparator (Tier 2)
+
+For every 4CAT dataset key listed in `FOURCAT_DATASETS`,
+`tests/map_item_compare.test.js`:
+
+1. sends a HEAD to the items endpoint and reads the datasource id from its
+   `X-4CAT-Dataset-Datasource` response header (no metadata-endpoint call)
+2. translates that id to a Zeeschuimer module name via
+   `zeeschuimer-to-4cat.json` (used in reverse)
+3. fetches `/download/<key>` (NDJSON inputs, already wrapped via
+   `wrap_for_map_item` by Zeeschuimer pre-upload) and
+   `/api/dataset/<key>/items/?annotations=no&missing_fields=keep&stream=true`
+   (expected outputs from 4CAT's Python `map_item`, as NDJSON — `stream=true`
+   avoids the JSON form's `limit=100` pagination)
+4. runs each input through the local `map_item`, pairs the mapped results
+   with the expected outputs by mapped `id` (or by index, with a warning,
+   if `id` is missing on either side), and field-by-field diffs each pair
+   (4CAT's API-only aggregate `missing_fields` key is excluded; per-field
+   `{__missing:true}` markers are still compared)
 
-**Setup**
+The comparator does **not** exercise `wrap_for_map_item` itself — Zeeschuimer
+applies it pre-storage and `/download/<key>` returns post-wrap items. This
+is an accepted gap; see `docs/map-item-test-plan.md`.
 
-1. Install Node.js dependencies:
-   ```bash
-   cd tests
-   npm install
-   ```
+**Configuration:** copy `tests/.env.example` to `tests/.env` and set:
+- `FOURCAT_URL` — base URL of the 4CAT instance (no trailing slash)
+- `FOURCAT_API_KEY` — raw API key (no `Bearer ` prefix)
+- `FOURCAT_DATASETS` — comma-separated list of dataset keys
 
-**Running tests**
+The comparator hard-errors at startup if any of these are missing.
+
+**Optional knob:** by default the comparator halts a dataset at its first
+failing item (reporting the rest as one skipped "halted" placeholder). To
+compare *every* item, pass `--all`:
 
 ```bash
-npm test
+npm run test:compare -- <dataset_key> --all
 ```
 
-For watch mode during development:
+`FAIL_FAST=0` (or `FAIL_FAST=false`) does the same, but prefer `--all`: an
+inline `FAIL_FAST=0 npm run …` does not reliably reach node when npm/node is
+the Windows binary run through WSL interop, and isn't env syntax in cmd.exe.
+A CLI flag crosses every shell.
+
+### Running
+
 ```bash
+# everything that's hermetic — duplicate-behavior unit + module load smoke
+npm test
+
+# watch mode for the same
 npm run test:watch
+
+# the comparator — every dataset key in FOURCAT_DATASETS
+npm run test:compare
+
+# the comparator narrowed to one dataset key (must still appear in
+# FOURCAT_DATASETS — protects against typos)
+npm run test:compare -- <dataset_key>
+
+# compare every item instead of halting at the first failure
+npm run test:compare -- <dataset_key> --all
 ```
 
-**Test coverage**
-- Schema upgrade backfills `last_updated` from `timestamp_collected`
-- Compound index correctly selects most recent item by `last_updated`
-- Forward-looking behavior: switching from "keep" to "update" targets newest record
-- Forward-looking behavior: switching from "update" to "keep" creates new records
-- Merge behavior: shallow merge preserves fields from both records
-- Skip behavior: no modifications occur when duplicate found
-- Platform isolation: same `item_id` on different platforms are independent
-- Tie-breaker: when `last_updated` is equal, prefer higher `id`
+### Where does a new test go?
+
+- **Pure data transformation, no live external state, runs anywhere.**
+  Duplicate-behavior unit suite (DB logic) or the Tier 1 smoke
+  (`map_item` static checks).
+- **Field-by-field correctness against 4CAT's Python `map_item`.** Tier 2
+  comparator. Add a dataset to `FOURCAT_DATASETS` that covers the case;
+  the comparator will pick it up.
+- **End-to-end user flow in the extension.** Selenium.
+
+### Why the environments differ
+
+The two Jest tiers run in **jsdom** rather than node env. The reasoning:
+
+- `map_item` bodies are pure data transformation, but four of them
+  (`gab`, `pinterest`, `rednote`, `truth`) call `strip_tags`, which
+  invokes `new DOMParser()`. jsdom provides a spec-compliant native
+  `DOMParser`; node env doesn't.
+- jsdom doesn't ship `fetch`. The standard workaround
+  (`undici`) crashes inside jsdom because it pokes at
+  `clearImmediate` / `markResourceTiming` / fast-now timers that jsdom
+  shadows. `cross-fetch` wraps `node-fetch` v2 internally and doesn't
+  hit those Node internals, so it works in jsdom — the comparator
+  imports `cross-fetch/polyfill` to assign `globalThis.fetch`.
+
+The tradeoff is parser parity: jsdom's `DOMParser` is not byte-equal to
+Firefox's Gecko `DOMParser`, which is what runs in production (and `fetch`
+is `cross-fetch`-via-`node-fetch`, not the browser's). Whitespace around `<br>`
+and block elements is the usual suspect. If the comparator emits false-
+positive diffs on text fields for the four `strip_tags` modules, the
+right fix is to normalise whitespace in the comparator's `deep_equal`
+rather than chase parser parity. The Selenium tier sits above and
+provides the real-Gecko fidelity check.
diff --git a/tests/_module-info.js b/tests/_module-info.js
new file mode 100644
index 0000000..e6866a3
--- /dev/null
+++ b/tests/_module-info.js
@@ -0,0 +1,59 @@
+/**
+ * Shared helper for the map_item test drivers.
+ *
+ * Pre-validates a module by:
+ *   1. Running `node --check` on its file (syntax check; avoids the
+ *      worker-killing experimental-ESM crash when a syntax error reaches
+ *      the dynamic importer).
+ *   2. Dynamically importing it and checking for a `map_item` export.
+ *
+ * Results are cached per module name in module-level Maps, so later calls
+ * for an already-inspected module reuse the stored result (no re-spawnSync).
+ *
+ * Returns one of four states the test driver can branch on:
+ *   { state: 'ok',           map_item: <fn> }
+ *   { state: 'no_map_item' }
+ *   { state: 'syntax_error', error: <string> }
+ *   { state: 'import_error', error: <Error> }
+ */
+
+import { spawnSync } from 'node:child_process';
+import { join, dirname } from 'node:path';
+import { fileURLToPath } from 'node:url';
+
+const __dirname = dirname(fileURLToPath(import.meta.url));
+const MODULES_ROOT = join(__dirname, '..', 'modules');
+
+const syntax_cache = new Map();
+const inspect_cache = new Map();
+
+function check_module_syntax(module_name) {
+    if (syntax_cache.has(module_name)) return syntax_cache.get(module_name);
+    const module_path = join(MODULES_ROOT, `${module_name}.js`);
+    const result = spawnSync(process.execPath, ['--check', module_path], { encoding: 'utf8' });
+    const out = result.status === 0
+        ? null
+        : (result.stderr || result.stdout || `exit code ${result.status}`).trim();
+    syntax_cache.set(module_name, out);
+    return out;
+}
+
+export async function inspect_module(module_name) {
+    if (inspect_cache.has(module_name)) return inspect_cache.get(module_name);
+    const syntax_error = check_module_syntax(module_name);
+    let result;
+    if (syntax_error) {
+        result = { state: 'syntax_error', error: syntax_error };
+    } else {
+        try {
+            const mod = await import(`../modules/${module_name}.js`);
+            result = typeof mod.map_item === 'function'
+                ? { state: 'ok', map_item: mod.map_item }
+                : { state: 'no_map_item' };
+        } catch (e) {
+            result = { state: 'import_error', error: e };
+        }
+    }
+    inspect_cache.set(module_name, result);
+    return result;
+}
diff --git a/tests/duplicate-behavior.test.js b/tests/duplicate-behavior.test.js
index 031f663..9f0662b 100644
--- a/tests/duplicate-behavior.test.js
+++ b/tests/duplicate-behavior.test.js
@@ -5,8 +5,9 @@
  * update or merge behaviors to duplicates across navigation boundaries.
  */
 
+import 'fake-indexeddb/auto';
+
 let Dexie;
-require('fake-indexeddb/auto');
 
 // Mock browser extension APIs
 global.browser = {
diff --git a/tests/jest.compare.config.cjs b/tests/jest.compare.config.cjs
new file mode 100644
index 0000000..070e2ff
--- /dev/null
+++ b/tests/jest.compare.config.cjs
@@ -0,0 +1,20 @@
+// Tier 2 — live comparator against a 4CAT instance.
+//
+// Runs only `map_item_compare.test.js`. Requires FOURCAT_URL,
+// FOURCAT_API_KEY, and FOURCAT_DATASETS to be set in tests/.env. Hard-errors
+// rather than silently skipping if env is missing.
+//
+// Env is jsdom so that the four modules using `strip_tags` (gab, pinterest,
+// rednote, truth) have a native DOMParser. The comparator uses cross-fetch
+// to provide a jsdom-friendly fetch (jsdom doesn't ship fetch and undici
+// crashes inside jsdom).
+module.exports = {
+  testEnvironment: 'jsdom',
+  testMatch: ['**/map_item_compare.test.js'],
+  testPathIgnorePatterns: ['/node_modules/'],
+  transform: {},
+  moduleFileExtensions: ['js', 'json'],
+  setupFiles: ['<rootDir>/setup-globals.cjs'],
+  testTimeout: 30000,
+  verbose: true
+};
diff --git a/tests/jest.config.cjs b/tests/jest.config.cjs
new file mode 100644
index 0000000..239abbc
--- /dev/null
+++ b/tests/jest.config.cjs
@@ -0,0 +1,12 @@
+// Default Jest config — Tier 1 only (duplicate-behavior + load-only smoke).
+// The comparator is excluded; invoke it via `npm run test:compare`.
+module.exports = {
+  testEnvironment: 'jsdom',
+  testMatch: ['**/*.test.js'],
+  testPathIgnorePatterns: ['/node_modules/', 'map_item_compare\\.test\\.js$'],
+  transform: {},
+  moduleFileExtensions: ['js', 'json'],
+  collectCoverageFrom: ['*.test.js'],
+  setupFiles: ['<rootDir>/setup-globals.cjs'],
+  verbose: true
+};
diff --git a/tests/jest.config.js b/tests/jest.config.js
deleted file mode 100644
index 7dd5b02..0000000
--- a/tests/jest.config.js
+++ /dev/null
@@ -1,8 +0,0 @@
-module.exports = {
-  testEnvironment: 'jsdom',
-  testMatch: ['**/*.test.js'],
-  transform: {},
-  moduleFileExtensions: ['js', 'json'],
-  collectCoverageFrom: ['duplicate-behavior.test.js'],
-  verbose: true
-};
diff --git a/tests/map_item.test.js b/tests/map_item.test.js
new file mode 100644
index 0000000..774c083
--- /dev/null
+++ b/tests/map_item.test.js
@@ -0,0 +1,49 @@
+/**
+ * Load-only smoke for every module under `modules/*.js`.
+ *
+ * For each module file, runs `inspect_module()` and asserts the module:
+ *   - parses (no SyntaxError)
+ *   - imports without throwing
+ *   - either exports a `map_item` function, or doesn't (both are fine here)
+ *
+ * No data is fed through `map_item`. That work belongs in the comparator
+ * (Tier 2 — `npm run test:compare`), where real items pulled from a 4CAT
+ * dataset provide both the input and the expected output.
+ *
+ * Catches: parse errors, import-time throws, broken top-level statements.
+ * Does NOT catch: anything that requires running `map_item` on real input.
+ */
+
+import { readdirSync } from 'node:fs';
+import { join, dirname } from 'node:path';
+import { fileURLToPath } from 'node:url';
+import { inspect_module } from './_module-info.js';
+
+const __dirname = dirname(fileURLToPath(import.meta.url));
+const MODULES_ROOT = join(__dirname, '..', 'modules');
+
+const module_files = readdirSync(MODULES_ROOT)
+    .filter(f => f.endsWith('.js') && !f.startsWith('_'));
+
+const module_info = {};
+for (const file of module_files) {
+    const name = file.replace(/\.js$/, '');
+    module_info[name] = await inspect_module(name);
+}
+
+describe('module load smoke', () => {
+    for (const file of module_files) {
+        const name = file.replace(/\.js$/, '');
+        test(`modules/${file} loads cleanly`, () => {
+            const info = module_info[name];
+            if (info.state === 'syntax_error') {
+                throw new Error(`syntax error in modules/${file}:\n${info.error}`);
+            }
+            if (info.state === 'import_error') {
+                throw new Error(`import failed for modules/${file}: ${info.error.message}`);
+            }
+            // 'ok' or 'no_map_item' — both acceptable at this tier.
+            expect(['ok', 'no_map_item']).toContain(info.state);
+        });
+    }
+});
diff --git a/tests/map_item_compare.test.js b/tests/map_item_compare.test.js
new file mode 100644
index 0000000..8e06979
--- /dev/null
+++ b/tests/map_item_compare.test.js
@@ -0,0 +1,480 @@
+/**
+ * Compare JS map_item output against 4CAT's Python map_item via dataset keys.
+ *
+ * For each 4CAT dataset key in FOURCAT_DATASETS, this test:
+ *   1. HEADs the items endpoint to read the datasource id from the
+ *      `X-4CAT-Dataset-*` response headers (no metadata-endpoint dependency)
+ *   2. translates that id back to a Zeeschuimer module name via
+ *      zeeschuimer-to-4cat.json (used in reverse)
+ *   3. inspects the local module (must export map_item)
+ *   4. fetches in parallel, both as NDJSON:
+ *        /download/<key>                       -> INPUTS (post-wrap)
+ *        /api/dataset/<key>/items/?annotations=no&missing_fields=keep&stream=true
+ *                                              -> mapped EXPECTED OUTPUTS
+ *   5. runs each input through the local map_item, then pairs by the
+ *      resulting MAPPED `id` — which can differ from the raw input id (e.g.
+ *      instagram maps to the post shortcode, not the numeric pk) — and
+ *      deep-equals each mapped result against the corresponding expected
+ *      output.
+ *
+ * The items endpoint is fetched with `stream=true` (NDJSON): its JSON-array
+ * form paginates at `limit=100`, silently dropping rows on larger datasets.
+ * `annotations=no` drops processor-added fields; `missing_fields=keep` keeps
+ * unmapped fields as `{ __missing: true, value: "" }` markers (matching the JS
+ * side) and additionally adds a comma-joined `missing_fields` summary key.
+ * That summary is API-only — the JS map_item never emits it — so it is
+ * excluded from the diff (see API_ONLY_FIELDS); the per-field markers it
+ * summarizes are still compared.
+ *
+ * Items from /download/<key> already have `wrap_for_map_item` applied by
+ * Zeeschuimer pre-upload, so they're fed to map_item directly without
+ * re-wrapping. The trade-off is that this comparator does not exercise
+ * `wrap_for_map_item` itself — see docs/map-item-test-plan.md for the
+ * accepted-gap rationale.
+ *
+ * Environment notes (fetch + DOMParser):
+ *   - jsdom env so `strip_tags` (used by gab/pinterest/rednote/truth) has
+ *     a native DOMParser.
+ *   - jsdom doesn't ship `fetch`. Spiked three candidates on 2026-06-03
+ *     under node:20-alpine:
+ *       * `undici`     — crashes at import in jsdom (pokes at
+ *                        clearImmediate/markResourceTiming/fast-now
+ *                        timers that jsdom shadows).
+ *       * `node-fetch` v3 — imports clean but `res.text()` throws
+ *                        `ReferenceError: TextDecoder is not defined`
+ *                        (jsdom doesn't expose TextDecoder as a global).
+ *       * `cross-fetch/polyfill` — clean import + working round-trip.
+ *     So this file imports `cross-fetch/polyfill`, which assigns
+ *     `globalThis.fetch` when undefined.
+ *
+ * Invocation:
+ *   npm run test:compare                 # runs every key in FOURCAT_DATASETS
+ *   npm run test:compare -- <key>        # narrows to one key (must be in
+ *                                        #   FOURCAT_DATASETS to avoid typos)
+ *
+ * Hard-errors at registration time if FOURCAT_URL, FOURCAT_API_KEY, or
+ * FOURCAT_DATASETS is missing — by Tier 2 contract these are required.
+ */
+
+import 'cross-fetch/polyfill';
+import 'dotenv/config';
+import { readFileSync, existsSync } from 'node:fs';
+import { join, dirname } from 'node:path';
+import { fileURLToPath } from 'node:url';
+import { inspect_module } from './_module-info.js';
+
+const __dirname = dirname(fileURLToPath(import.meta.url));
+
+const FOURCAT_URL = process.env.FOURCAT_URL?.replace(/\/$/, '');
+const FOURCAT_API_KEY = process.env.FOURCAT_API_KEY;
+
+// Hard-fail if env is missing — Tier 2 contract.
+function require_env(name, value, placeholder_values = []) {
+    if (!value || placeholder_values.includes(value)) {
+        throw new Error(
+            `${name} is not configured. Set it in tests/.env (see tests/.env.example).`
+        );
+    }
+    return value;
+}
+require_env('FOURCAT_URL', FOURCAT_URL);
+require_env('FOURCAT_API_KEY', FOURCAT_API_KEY, ['your-api-key-here']);
+
+const FOURCAT_DATASETS = require_env(
+    'FOURCAT_DATASETS',
+    process.env.FOURCAT_DATASETS,
+    ['key1,key2,key3'],
+)
+    .split(',')
+    .map(k => k.trim())
+    .filter(k => k.length > 0);
+
+if (FOURCAT_DATASETS.length === 0) {
+    throw new Error('FOURCAT_DATASETS parsed as empty. Set a comma-separated list of dataset keys in tests/.env.');
+}
+
+// Optional narrowing to a single dataset key. The `npm run test:compare --
+// <key>` form is handled by run-compare.mjs, which sets COMPARE_DATASET; jest
+// itself would mis-read a bare key as a test-path-pattern filter and silently
+// run nothing. A narrowed key must still be declared in FOURCAT_DATASETS —
+// erroring on an unlisted key catches typos and keeps the dataset list the
+// single source of truth.
+const COMPARE_DATASET = process.env.COMPARE_DATASET?.trim() || undefined;
+if (COMPARE_DATASET && !FOURCAT_DATASETS.includes(COMPARE_DATASET)) {
+    throw new Error(
+        `COMPARE_DATASET=${COMPARE_DATASET} is not listed in FOURCAT_DATASETS. ` +
+        `Add it to tests/.env before narrowing the run to it.`
+    );
+}
+
+const DATASET_KEYS_TO_RUN = COMPARE_DATASET ? [COMPARE_DATASET] : FOURCAT_DATASETS;
+
+// 4CAT datasource id -> Zeeschuimer module name. The on-disk map is
+// authored in the natural direction (zeeschuimer -> 4cat); flip here.
+const ID_MAP_PATH = join(__dirname, 'zeeschuimer-to-4cat.json');
+const ZEESCHUIMER_TO_4CAT = existsSync(ID_MAP_PATH)
+    ? JSON.parse(readFileSync(ID_MAP_PATH, 'utf8'))
+    : {};
+const FOURCAT_TO_ZEESCHUIMER = Object.fromEntries(
+    Object.entries(ZEESCHUIMER_TO_4CAT)
+        .filter(([k]) => !k.startsWith('_'))
+        .map(([z, f]) => [f, z])
+);
+
+// When true (default), comparison of a dataset stops at its first failing
+// item; the remaining items are reported as a single skipped "halted"
+// placeholder rather than one failure each. Disable it with the `--all`
+// launcher flag (preferred — crosses every shell) or FAIL_FAST=0. Trim
+// because `set FAIL_FAST=0 && ...` in cmd.exe includes the trailing space;
+// treat both '0' and 'false' (case-insensitive) as off.
+const FAIL_FAST_RAW = (process.env.FAIL_FAST ?? '').trim().toLowerCase();
+const FAIL_FAST = FAIL_FAST_RAW !== '0' && FAIL_FAST_RAW !== 'false';
+
+function auth_headers(extra = {}) {
+    return {
+        // 4CAT accepts the raw key without a `Bearer ` prefix.
+        'Authorization': FOURCAT_API_KEY,
+        ...extra,
+    };
+}
+
+async function fetch_headers(url) {
+    const res = await fetch(url, { method: 'HEAD', headers: auth_headers() });
+    if (!res.ok) throw new Error(`HTTP ${res.status} from HEAD ${url}`);
+    return res.headers;
+}
+
+async function fetch_ndjson(url) {
+    const res = await fetch(url, { headers: auth_headers() });
+    const text = await res.text();
+    if (!res.ok) throw new Error(`HTTP ${res.status} from ${url}: ${text}`);
+    return text
+        .split('\n')
+        .filter(line => line.trim().length > 0)
+        .map((line, i) => {
+            try { return JSON.parse(line); }
+            catch (e) { throw new Error(`bad NDJSON at line ${i} of ${url}: ${e.message}`); }
+        });
+}
+
+function normalize(value) {
+    return JSON.parse(JSON.stringify(value));
+}
+
+function deep_equal(a, b) {
+    if (a === b) return true;
+    if (a === null || b === null) return a === b;
+    if (typeof a !== typeof b) return false;
+    if (typeof a !== 'object') return false;
+    if (Array.isArray(a) !== Array.isArray(b)) return false;
+    if (Array.isArray(a)) {
+        if (a.length !== b.length) return false;
+        return a.every((v, i) => deep_equal(v, b[i]));
+    }
+    const a_keys = Object.keys(a);
+    const b_keys = Object.keys(b);
+    if (a_keys.length !== b_keys.length) return false;
+    return a_keys.every(k => k in b && deep_equal(a[k], b[k]));
+}
+
+function diff_objects(js_obj, py_obj) {
+    const diffs = [];
+    const keys = new Set([...Object.keys(js_obj ?? {}), ...Object.keys(py_obj ?? {})]);
+    for (const key of keys) {
+        const in_js = js_obj && key in js_obj;
+        const in_py = py_obj && key in py_obj;
+        if (!in_js) {
+            diffs.push({ key, kind: 'only_python', python: py_obj[key] });
+        } else if (!in_py) {
+            diffs.push({ key, kind: 'only_js', js: js_obj[key] });
+        } else if (!deep_equal(js_obj[key], py_obj[key])) {
+            diffs.push({ key, kind: 'mismatch', js: js_obj[key], python: py_obj[key] });
+        }
+    }
+    return diffs;
+}
+
+function format_diffs(diffs) {
+    return diffs.map(d => {
+        if (d.kind === 'only_js') {
+            return `  + only in JS:     ${d.key} = ${JSON.stringify(d.js)}`;
+        }
+        if (d.kind === 'only_python') {
+            return `  - only in Python: ${d.key} = ${JSON.stringify(d.python)}`;
+        }
+        return `  ~ ${d.key}\n      JS:     ${JSON.stringify(d.js)}\n      Python: ${JSON.stringify(d.python)}`;
+    }).join('\n');
+}
+
+function format_error_with_location(err) {
+    if (!err) return String(err);
+    const message = err.message || String(err);
+    const stack = err.stack || '';
+    const module_frames = stack.split('\n')
+        .filter(l => l.includes('/modules/') || l.includes('\\modules\\'))
+        .slice(0, 3)
+        .map(l => l.trim());
+    return module_frames.length
+        ? `${message}\n  ${module_frames.join('\n  ')}`
+        : message;
+}
+
+// Map each input through the local map_item, then pair the mapped result
+// against the expected output by `id`. Pairing MUST key on the mapped id:
+// some modules emit an `id` that differs from the raw input id — instagram,
+// for instance, maps to the post shortcode (`node.code`), not the numeric pk
+// — so pairing raw input ids against the API's already-mapped ids would match
+// nothing. Falls back to index pairing (with a logged warning) if either side
+// lacks a usable id. A throw inside map_item is captured per-item and surfaced
+// later as that item's failure.
+function map_and_pair(inputs, outputs, map_item, dataset_key) {
+    // Map every input up front so pairing can key on the mapped id.
+    const mapped = inputs.map(input => {
+        try {
+            return { input, js_result: map_item(input), error: null };
+        } catch (e) {
+            return {
+                input,
+                js_result: null,
+                error: new Error(`JS map_item threw: ${format_error_with_location(e)}`),
+            };
+        }
+    });
+
+    const probe_mapped = mapped.find(m => m.js_result)?.js_result;
+    const probe_out = outputs[0];
+    const has_id_mapped = probe_mapped && 'id' in probe_mapped && probe_mapped.id != null;
+    const has_id_out = probe_out && 'id' in probe_out && probe_out.id != null;
+
+    if (!has_id_mapped || !has_id_out) {
+        // eslint-disable-next-line no-console
+        console.warn(
+            `[compare] ${dataset_key}: no usable 'id' on ${!has_id_mapped ? 'map_item output' : '/items'} ` +
+            `side — falling back to index pairing for this dataset.`
+        );
+        const n = Math.min(mapped.length, outputs.length);
+        return {
+            mode: 'index',
+            pairs: Array.from({ length: n }, (_, i) => ({
+                input: mapped[i].input,
+                js_result: mapped[i].js_result,
+                error: mapped[i].error,
+                expected: outputs[i],
+                id: i,
+            })),
+            input_count: inputs.length,
+            output_count: outputs.length,
+            unmatched_inputs: [],
+            unmatched_outputs: [],
+        };
+    }
+
+    const by_id_out = new Map();
+    for (const item of outputs) by_id_out.set(String(item.id), item);
+
+    const pairs = [];
+    const unmatched_inputs = [];
+    for (const m of mapped) {
+        // A throw produces no mapped id to pair on. Surface it as its own
+        // failing item (labelled with the raw input id) rather than burying it
+        // in the unmatched-id list — otherwise an id-transforming module hides
+        // the actual map_item error behind a generic "unmatched input" report.
+        if (m.error) {
+            const label = m.input && m.input.id != null ? String(m.input.id) : '(no id)';
+            pairs.push({ input: m.input, js_result: null, error: m.error, expected: null, id: label });
+            continue;
+        }
+        // Key on the mapped id; a successful map whose id matches no output is
+        // a genuine pairing miss and goes to unmatched_inputs.
+        const lookup_id = m.js_result && m.js_result.id != null ? String(m.js_result.id) : null;
+        const expected = lookup_id != null ? by_id_out.get(lookup_id) : undefined;
+        if (expected) {
+            pairs.push({ input: m.input, js_result: m.js_result, error: null, expected, id: lookup_id });
+            by_id_out.delete(lookup_id);
+        } else {
+            unmatched_inputs.push(lookup_id);
+        }
+    }
+    return {
+        mode: 'id',
+        pairs,
+        input_count: inputs.length,
+        output_count: outputs.length,
+        unmatched_inputs,
+        unmatched_outputs: Array.from(by_id_out.keys()),
+    };
+}
+
+// Recover the datasource id from a dataset's response headers. 4CAT exposes it
+// directly as `X-4CAT-Dataset-Datasource`. Older responses may only carry
+// `X-4CAT-Dataset-Type` (the datasource id with a `-search`/`-import` suffix),
+// so fall back to stripping that — anchored to end-of-string because
+// datasource ids can themselves contain hyphens (e.g. `xiaohongshu-comments`).
+// The result is translated to a Zeeschuimer module via FOURCAT_TO_ZEESCHUIMER.
+function datasource_id_from_headers(headers) {
+    const datasource = headers.get('x-4cat-dataset-datasource');
+    if (datasource) return datasource.trim();
+    const type = headers.get('x-4cat-dataset-type');
+    if (type) return type.trim().replace(/-(search|import)$/, '');
+    return null;
+}
+
+// Fields 4CAT's API attaches to every mapped item that the JS map_item never
+// produces, so they would otherwise diff as spurious "only_python" entries.
+// `missing_fields` is a comma-joined summary of which fields came back as
+// MissingMappedField — redundant with the per-field `{__missing:true}`
+// markers, which ARE compared.
+const API_ONLY_FIELDS = new Set(['missing_fields']);
+
+function strip_api_fields(obj) {
+    if (!obj || typeof obj !== 'object' || Array.isArray(obj)) return obj;
+    const out = {};
+    for (const k of Object.keys(obj)) {
+        if (!API_ONLY_FIELDS.has(k)) out[k] = obj[k];
+    }
+    return out;
+}
+
+// Diff each paired (already-mapped) JS result against 4CAT's expected output.
+// map_item was run up front during pairing — so we could key on the mapped id
+// — so here we only diff, or report an input whose map_item threw. With
+// FAIL_FAST on (default), stop at the first failing item and record how many
+// were left unchecked — so one bad item yields a single failure plus one
+// skipped "halted" placeholder, not N failures.
+function compare_pairs(pairs) {
+    const results = [];
+    let halted_count = 0;
+    for (let i = 0; i < pairs.length; i++) {
+        const { id, js_result, error, expected } = pairs[i];
+        let message = null;
+        if (error) {
+            message = error.message;
+        } else {
+            const diffs = diff_objects(
+                strip_api_fields(normalize(js_result)),
+                strip_api_fields(normalize(expected)),
+            );
+            if (diffs.length > 0) {
+                message = `${diffs.length} field(s) differ between JS and 4CAT:\n${format_diffs(diffs)}`;
+            }
+        }
+        results.push({ id, ok: message === null, message });
+        if (message !== null && FAIL_FAST) {
+            halted_count = pairs.length - (i + 1);
+            break;
+        }
+    }
+    return { results, halted_count };
+}
+
+// Pre-pass: for each dataset, resolve the datasource (HEAD), fetch items, and
+// run the comparison up front, so tests register with knowable counts and a
+// deterministic pass/fail per item. Fetch/setup failures become a single
+// "setup" failure inside that dataset's describe.
+const dataset_state = {};
+for (const key of DATASET_KEYS_TO_RUN) {
+    try {
+        // The same items URL serves double duty: a HEAD reveals the datasource
+        // (via X-4CAT-Dataset-* headers) with no body; the GET pulls the mapped
+        // rows. `stream=true` avoids the JSON form's limit=100 pagination, which
+        // would silently drop rows (and break id-pairing) on larger datasets.
+        const items_url = `${FOURCAT_URL}/api/dataset/${key}/items/?annotations=no&missing_fields=keep&stream=true`;
+        const headers = await fetch_headers(items_url);
+        const datasource_id = datasource_id_from_headers(headers);
+        if (!datasource_id) {
+            throw new Error(
+                `no datasource id in response headers for ${key} ` +
+                `(looked for X-4CAT-Dataset-Datasource / X-4CAT-Dataset-Type)`
+            );
+        }
+        const module_name = FOURCAT_TO_ZEESCHUIMER[datasource_id] ?? datasource_id;
+        const module_state = await inspect_module(module_name);
+
+        if (module_state.state === 'ok') {
+            const [inputs, outputs] = await Promise.all([
+                fetch_ndjson(`${FOURCAT_URL}/download/${key}`),
+                fetch_ndjson(items_url),
+            ]);
+            const pairing = map_and_pair(inputs, outputs, module_state.map_item, key);
+            const comparison = compare_pairs(pairing.pairs);
+            dataset_state[key] = { datasource_id, module_name, module_state, pairing, comparison };
+        } else {
+            dataset_state[key] = { datasource_id, module_name, module_state };
+        }
+    } catch (e) {
+        dataset_state[key] = { error: e };
+    }
+}
+
+for (const dataset_key of DATASET_KEYS_TO_RUN) {
+    const info = dataset_state[dataset_key];
+
+    if (info.error) {
+        describe(`map_item compare: dataset ${dataset_key}`, () => {
+            test('setup', () => { throw info.error; });
+        });
+        continue;
+    }
+
+    const { datasource_id, module_name, module_state, pairing, comparison } = info;
+    const label = `${dataset_key} (datasource: ${datasource_id}, module: ${module_name})`;
+
+    if (module_state.state === 'no_map_item') {
+        describe(`map_item compare: ${label}`, () => {
+            test.skip(`modules/${module_name}.js has no map_item — nothing to compare`, () => {});
+        });
+        continue;
+    }
+    if (module_state.state === 'syntax_error' || module_state.state === 'import_error') {
+        const msg = module_state.state === 'syntax_error'
+            ? `syntax error:\n${module_state.error}`
+            : `import failed: ${module_state.error.message}`;
+        describe(`map_item compare: ${label}`, () => {
+            test('module loads', () => { throw new Error(msg); });
+        });
+        continue;
+    }
+
+    describe(`map_item compare: ${label}`, () => {
+        test('pairing', () => {
+            const messages = [];
+            if (pairing.input_count !== pairing.output_count) {
+                messages.push(
+                    `input count ${pairing.input_count} != output count ${pairing.output_count}`
+                );
+            }
+            if (pairing.unmatched_inputs.length) {
+                const shown = pairing.unmatched_inputs.slice(0, 5).join(', ');
+                const extra = pairing.unmatched_inputs.length > 5
+                    ? ` (+${pairing.unmatched_inputs.length - 5} more)`
+                    : '';
+                messages.push(`unmatched input ids: ${shown}${extra}`);
+            }
+            if (pairing.unmatched_outputs.length) {
+                const shown = pairing.unmatched_outputs.slice(0, 5).join(', ');
+                const extra = pairing.unmatched_outputs.length > 5
+                    ? ` (+${pairing.unmatched_outputs.length - 5} more)`
+                    : '';
+                messages.push(`unmatched output ids: ${shown}${extra}`);
+            }
+            if (pairing.mode === 'index') {
+                messages.push(`paired by index (no usable 'id' field) — diffs may be misaligned`);
+            }
+            if (messages.length) throw new Error(messages.join('\n'));
+        });
+
+        comparison.results.forEach(({ id, ok, message }, i) => {
+            test(`item ${i} (id=${id})`, () => {
+                if (!ok) throw new Error(message);
+            });
+        });
+
+        if (comparison.halted_count > 0) {
+            test.skip(
+                `halted after first failure — ${comparison.halted_count} later item(s) not compared ` +
+                `(pass --all, or set FAIL_FAST=0, to compare every item)`,
+                () => {},
+            );
+        }
+    });
+}
diff --git a/tests/package-lock.json b/tests/package-lock.json
index cc8f457..ada8011 100644
--- a/tests/package-lock.json
+++ b/tests/package-lock.json
@@ -8,7 +8,9 @@
       "name": "zeeschuimer-db-tests",
       "version": "1.0.0",
       "devDependencies": {
+        "cross-fetch": "^4.0.0",
         "dexie": "^3.2.4",
+        "dotenv": "^16.4.5",
         "fake-indexeddb": "^5.0.1",
         "jest": "^29.7.0",
         "jest-environment-jsdom": "^29.7.0"
@@ -1597,6 +1599,16 @@
         "node": "^14.15.0 || ^16.10.0 || >=18.0.0"
       }
     },
+    "node_modules/cross-fetch": {
+      "version": "4.1.0",
+      "resolved": "https://registry.npmjs.org/cross-fetch/-/cross-fetch-4.1.0.tgz",
+      "integrity": "sha512-uKm5PU+MHTootlWEY+mZ4vvXoCn4fLQxT9dSc1sXVMSFkINTJVN8cAQROpwcKm8bJ/c7rgZVIBWzH5T78sNZZw==",
+      "dev": true,
+      "license": "MIT",
+      "dependencies": {
+        "node-fetch": "^2.7.0"
+      }
+    },
     "node_modules/cross-spawn": {
       "version": "7.0.6",
       "resolved": "https://registry.npmjs.org/cross-spawn/-/cross-spawn-7.0.6.tgz",
@@ -1758,6 +1770,19 @@
         "node": ">=12"
       }
     },
+    "node_modules/dotenv": {
+      "version": "16.6.1",
+      "resolved": "https://registry.npmjs.org/dotenv/-/dotenv-16.6.1.tgz",
+      "integrity": "sha512-uBq4egWHTcTt33a72vpSG0z3HnPuIl6NqYcTrKEg2azoEyl2hpW0zqlxysq2pK9HlDIHyHyakeYaYnSAwd8bow==",
+      "dev": true,
+      "license": "BSD-2-Clause",
+      "engines": {
+        "node": ">=12"
+      },
+      "funding": {
+        "url": "https://dotenvx.com"
+      }
+    },
     "node_modules/dunder-proto": {
       "version": "1.0.1",
       "resolved": "https://registry.npmjs.org/dunder-proto/-/dunder-proto-1.0.1.tgz",
@@ -3466,6 +3491,52 @@
       "dev": true,
       "license": "MIT"
     },
+    "node_modules/node-fetch": {
+      "version": "2.7.0",
+      "resolved": "https://registry.npmjs.org/node-fetch/-/node-fetch-2.7.0.tgz",
+      "integrity": "sha512-c4FRfUm/dbcWZ7U+1Wq0AwCyFL+3nt2bEw05wfxSz+DWpWsitgmSgYmy2dQdWyKC1694ELPqMs/YzUSNozLt8A==",
+      "dev": true,
+      "license": "MIT",
+      "dependencies": {
+        "whatwg-url": "^5.0.0"
+      },
+      "engines": {
+        "node": "4.x || >=6.0.0"
+      },
+      "peerDependencies": {
+        "encoding": "^0.1.0"
+      },
+      "peerDependenciesMeta": {
+        "encoding": {
+          "optional": true
+        }
+      }
+    },
+    "node_modules/node-fetch/node_modules/tr46": {
+      "version": "0.0.3",
+      "resolved": "https://registry.npmjs.org/tr46/-/tr46-0.0.3.tgz",
+      "integrity": "sha512-N3WMsuqV66lT30CrXNbEjx4GEwlow3v6rr4mCcv6prnfwhS01rkgyFdjPNBYd9br7LpXV1+Emh01fHnq2Gdgrw==",
+      "dev": true,
+      "license": "MIT"
+    },
+    "node_modules/node-fetch/node_modules/webidl-conversions": {
+      "version": "3.0.1",
+      "resolved": "https://registry.npmjs.org/webidl-conversions/-/webidl-conversions-3.0.1.tgz",
+      "integrity": "sha512-2JAn3z8AR6rjK8Sm8orRC0h/bcl/DqL7tRPdGZ4I1CjdF+EaMLmYxBHyXuKL849eucPFhvBoxMsflfOb8kxaeQ==",
+      "dev": true,
+      "license": "BSD-2-Clause"
+    },
+    "node_modules/node-fetch/node_modules/whatwg-url": {
+      "version": "5.0.0",
+      "resolved": "https://registry.npmjs.org/whatwg-url/-/whatwg-url-5.0.0.tgz",
+      "integrity": "sha512-saE57nupxk6v3HY35+jzBwYa0rKSy0XR8JSxZPwgLr7ys0IBzhGviA1/TUGJLmSVqs8pb9AnvICXEuOHLprYTw==",
+      "dev": true,
+      "license": "MIT",
+      "dependencies": {
+        "tr46": "~0.0.3",
+        "webidl-conversions": "^3.0.0"
+      }
+    },
     "node_modules/node-int64": {
       "version": "0.4.0",
       "resolved": "https://registry.npmjs.org/node-int64/-/node-int64-0.4.0.tgz",
diff --git a/tests/package.json b/tests/package.json
index dc3654c..763321c 100644
--- a/tests/package.json
+++ b/tests/package.json
@@ -1,13 +1,17 @@
 {
   "name": "zeeschuimer-db-tests",
   "version": "1.0.0",
-  "description": "Unit tests for Zeeschuimer duplicate handling logic",
+  "description": "Unit tests for Zeeschuimer duplicate handling logic and map_item generator output",
+  "type": "module",
   "scripts": {
-    "test": "jest",
-    "test:watch": "jest --watch"
+    "test": "node --experimental-vm-modules node_modules/jest/bin/jest.js --config jest.config.cjs",
+    "test:watch": "node --experimental-vm-modules node_modules/jest/bin/jest.js --config jest.config.cjs --watch",
+    "test:compare": "node run-compare.mjs"
   },
   "devDependencies": {
+    "cross-fetch": "^4.0.0",
     "dexie": "^3.2.4",
+    "dotenv": "^16.4.5",
     "fake-indexeddb": "^5.0.1",
     "jest": "^29.7.0",
     "jest-environment-jsdom": "^29.7.0"
diff --git a/tests/run-compare.mjs b/tests/run-compare.mjs
new file mode 100644
index 0000000..57efb66
--- /dev/null
+++ b/tests/run-compare.mjs
@@ -0,0 +1,53 @@
+/**
+ * Launcher for the Tier 2 map_item comparator (`npm run test:compare`).
+ *
+ *   npm run test:compare              -> compares every key in FOURCAT_DATASETS
+ *   npm run test:compare -- <key>     -> narrows the run to a single key
+ *   npm run test:compare -- <key> --all   -> compare every item (no fail-fast)
+ *   npm run test:compare -- <key> -t "id=123"   -> key + forwarded jest flags
+ *
+ * Why this exists instead of invoking jest directly: jest treats any bare
+ * positional argument as a test-path-pattern filter. A 4CAT dataset key
+ * (`5daeba72a2dfbb5ed8c855f824a61570`) matches no test file path, so
+ * `jest <key>` silently discovers zero tests and exits "green" having run
+ * nothing. This launcher intercepts the first non-flag argument, hands it to
+ * the comparator through the COMPARE_DATASET env var, and forwards only the
+ * remaining flags to jest — so the key never reaches jest's argv.
+ */
+
+import { spawn } from 'node:child_process';
+import { fileURLToPath } from 'node:url';
+import { dirname, join } from 'node:path';
+
+const __dirname = dirname(fileURLToPath(import.meta.url));
+const args = process.argv.slice(2);
+
+// First non-flag arg (if any) is the dataset key to narrow to.
+const dataset_key = args.find(a => !a.startsWith('-'));
+const flags = args.filter(a => a !== dataset_key);
+
+// `--all` (alias `--no-fail-fast`) compares every item instead of halting at
+// the first failure. It's offered as a flag, not only via the FAIL_FAST env
+// var, because `FAIL_FAST=0 npm run ...` does not reliably reach node when
+// npm/node is the Windows binary invoked through WSL interop, and isn't env
+// syntax at all in cmd.exe. A CLI flag crosses every shell; the env var still
+// works where it propagates.
+const disable_fail_fast = flags.includes('--all') || flags.includes('--no-fail-fast');
+const jest_flags = flags.filter(f => f !== '--all' && f !== '--no-fail-fast');
+
+const env = { ...process.env };
+if (dataset_key) env.COMPARE_DATASET = dataset_key;
+if (disable_fail_fast) env.FAIL_FAST = '0';
+
+const jest_bin = join(__dirname, 'node_modules', 'jest', 'bin', 'jest.js');
+const child = spawn(
+    process.execPath,
+    ['--experimental-vm-modules', jest_bin, '--config', 'jest.compare.config.cjs', ...jest_flags],
+    { stdio: 'inherit', cwd: __dirname, env },
+);
+
+child.on('exit', code => process.exit(code ?? 1));
+child.on('error', err => {
+    console.error(`failed to launch jest: ${err.message}`);
+    process.exit(1);
+});
diff --git a/tests/setup-globals.cjs b/tests/setup-globals.cjs
new file mode 100644
index 0000000..b55e659
--- /dev/null
+++ b/tests/setup-globals.cjs
@@ -0,0 +1,45 @@
+/**
+ * Make js/lib.js's helpers available as globals inside the Jest test
+ * environment, mirroring how the browser sees them after the manifest
+ * loads lib.js as a plain script.
+ *
+ * map_item bodies reference these as free identifiers (MappedItem,
+ * MissingMappedField, strip_tags, normalize_url_encoding, ...). Without
+ * this shim they'd hit ReferenceError as soon as a test invokes map_item.
+ *
+ * Names are auto-discovered from lib.js by regex-matching top-level
+ * `function name(...)` and `class Name ...` declarations. Adding a helper
+ * to lib.js makes it available to tests without touching this file.
+ */
+
+const fs = require('node:fs');
+const path = require('node:path');
+
+const lib_source = fs.readFileSync(
+    path.join(__dirname, '..', 'js', 'lib.js'),
+    'utf8',
+);
+
+// Match `function name(` and `class Name {` / `class Name extends` at
+// column 0 of a line. lib.js is a classic script with all top-level
+// declarations unindented; requiring column 0 keeps nested helpers (like
+// the `_traverse_data` IIFE inside `traverse_data`) from being exposed.
+const NAME_PATTERN = /^(?:function|class)\s+([A-Za-z_$][A-Za-z0-9_$]*)\b/gm;
+const EXPOSED_NAMES = Array.from(
+    lib_source.matchAll(NAME_PATTERN),
+    m => m[1],
+);
+
+if (EXPOSED_NAMES.length === 0) {
+    throw new Error(
+        'setup-globals.cjs: no top-level function/class declarations found in js/lib.js — ' +
+        'auto-discovery regex may be broken. Tests will ReferenceError if not fixed.'
+    );
+}
+
+const factory = new Function(`
+${lib_source}
+return { ${EXPOSED_NAMES.join(', ')} };
+`);
+
+Object.assign(globalThis, factory());
diff --git a/tests/translation-errors.md b/tests/translation-errors.md
new file mode 100644
index 0000000..fcc160d
--- /dev/null
+++ b/tests/translation-errors.md
@@ -0,0 +1,430 @@
+# Auto-generator translation errors
+
+Patterns of incorrect Python → JavaScript translation observed in
+auto-generated `modules/*.js` files. Each entry has a search pattern so
+this doc doubles as a checklist when reviewing a new auto-generator PR.
+
+When an entry is fixed at the generator level (no longer appears in
+fresh output), mark it `[fixed]` and keep the entry around — useful
+history when something regresses.
+
+## How to use
+
+- Found a new pattern? Add an entry below following the template.
+- Reviewing a generator PR? `grep` each `Search pattern` against the
+  changed module files. Anything that hits is worth a manual look.
+- Iterating on the generator prompt? The "Why" lines are the
+  feedback to add — they describe the exact Python-vs-JS semantic
+  difference the LLM keeps missing.
+
+## Template
+
+```
+### <short-name>
+
+**Status:** open | fixed in generator | accepted
+
+**Why it happens:** <one-line description of the Python-vs-JS difference>
+
+**Wrong JS:**
+```js
+<the broken pattern>
+```
+
+**Correct JS:**
+```js
+<what it should look like>
+```
+
+**Example:** `modules/<file>.js:<line>`
+
+**Search pattern:** `<grep-able regex>`
+```
+
+---
+
+## Observed patterns
+
+### `in` operator on strings
+
+**Status:** open
+
+**Why it happens:** In Python, `"x" in some_string` is a substring check.
+In JavaScript, the `in` operator only works on **objects** and checks for
+property/key existence; using it with a string on the right-hand side
+throws `TypeError: cannot use 'in' operator to search for "x" in <string>`.
+
+**Wrong JS:**
+```js
+const is_polaris = '__typename' in item && 'polaris' in item.__typename.toLowerCase();
+```
+
+**Correct JS:**
+```js
+const is_polaris = '__typename' in item && item.__typename.toLowerCase().includes('polaris');
+```
+
+**Example:** `modules/instagram.js:513`
+
+**Search pattern:** `'[^']+' in [a-zA-Z_$][\w$]*\.` — quoted string followed
+by `in` followed by a method call. Quick rough check: `grep -E "' in [a-zA-Z]" modules/`
+
+**Watch out for partial fixes:** seen as `'polaris' in (item.__typename ?? '').toLowerCase()`
+— adding `?? ''` guards against `undefined` but the `in` operator itself
+still throws on the resulting *string*. The fix is `.includes()`, not just
+defaulting the operand.
+
+---
+
+### Python f-string syntax left in single-quoted JS strings
+
+**Status:** open
+
+**Why it happens:** Python `f"... {var} ..."` interpolates. JS uses
+template literals (backticks) with `${var}`. The auto-generator leaves the
+`{var}` notation in a regular single- or double-quoted JS string, which is
+just literal text — no interpolation happens.
+
+**Wrong JS:**
+```js
+throw new MapItemException('Unable to parse item: different user {user.id} and owner {owner.id}');
+```
+
+**Correct JS:**
+```js
+throw new MapItemException(`Unable to parse item: different user ${user.id} and owner ${owner.id}`);
+```
+
+**Example:** `modules/instagram.js:754`
+
+**Search pattern:** `'[^']*\{[a-zA-Z_$][\w$.]*\}[^']*'` or `"[^"]*\{[a-zA-Z_$][\w$.]*\}[^"]*"`
+— a non-template-literal string containing `{identifier}` or `{identifier.path}`.
+Quick check: `grep -nE "['\"][^'\"]*\{[a-zA-Z_][a-zA-Z0-9_.]*\}[^'\"]*['\"]" modules/`
+
+---
+
+### `?? {}` default that defeats subsequent truthy checks
+
+**Status:** open
+
+**Why it happens:** When porting Python's `node.get('user') or {}` (which is
+intended to make subsequent code safe to call), the generator emits
+`node.user ?? {}`. That's a *valid* Python-equivalent, **but** any following
+`if (user && owner) { ... }` guard then never short-circuits because both
+`{}` references are truthy. The check ends up reading "if user and owner
+*objects* exist" when the intent was "if user and owner data exist."
+Subsequent property accesses then compare real ids/usernames against
+`undefined` on the missing side, often throwing.
+
+**Wrong JS:**
+```js
+const user  = node.user  ?? {};
+const owner = node.owner ?? {};
+if (user && owner) {
+    if (user.id === owner.id) { /* … */ }
+    else if (user.username !== owner.username) {
+        throw new MapItemException('different user and owner');
+    }
+}
+```
+
+**Correct JS** (depending on intent — pick one):
+```js
+// (a) drop the defaults so truthy guard means "both present"
+const user  = node.user;
+const owner = node.owner;
+if (user && owner) { /* compare */ }
+```
+```js
+// (b) check for actual content, not just object identity
+const user  = node.user  ?? {};
+const owner = node.owner ?? {};
+if (Object.keys(user).length && Object.keys(owner).length) { /* compare */ }
+```
+
+**Example:** `modules/instagram.js:748-756`
+
+**Search pattern:** `\?\?\s*\{\s*\}` — any `?? {}` occurrence is worth a
+review of subsequent guards. Quick check: `grep -nE "\?\?\s*\{\s*\}" modules/`
+
+---
+
+### Bare relative path as a statement (junk auto-imports section)
+
+**Status:** open
+
+**Why it happens:** The generator emits an "auto-generated imports" marker
+block at the top of the module but writes the import target as a bare
+relative path on its own line (`../js/lib.js`) instead of a real `import`
+statement. JS parses that as `..` then `.` then `/js/lib.js` — syntax error.
+
+**Wrong JS:**
+```js
+// === auto-generated imports for map_item — DO NOT EDIT BY HAND ===
+../js/lib.js
+// === end auto-generated imports ===
+```
+
+**Correct JS** (one of):
+```js
+// === auto-generated imports — DO NOT EDIT BY HAND ===
+// Provided as globals by js/lib.js (loaded via manifest.json):
+//   MappedItem, MissingMappedField, MapItemException, traverse_data,
+//   strip_tags, normalize_url_encoding, formatUtcTimestamp
+// === end auto-generated imports ===
+```
+
+Or, if a real import is intended, an ESM import with named bindings:
+```js
+import { MappedItem, MissingMappedField } from '../js/lib.js';
+```
+
+**Example:** seen historically in `modules/tiktok.js:2`
+
+**Search pattern:** `^\.\./` at the start of a line in module files.
+Quick check: `grep -nE "^\.\." modules/*.js`
+
+---
+
+### Key-existence check (`'X' in obj`) used where Python intended value-truthiness (`obj.get('X')`)
+
+**Status:** open
+
+**Why it happens:** Python's `if node.get('usertags'):` is a *truthy check on
+the value* — returns False if the key is missing **or** if the value is
+`None`/empty/falsy. The generator translates this to `if ('usertags' in
+node)`, which in JS is a *key-existence check* — returns True even when
+the value is `null`. Subsequent property accesses on the null value then
+throw `Cannot read properties of null`.
+
+**Wrong JS:**
+```js
+const usertags = 'usertags' in node ? node.usertags.in.map(...).join(',') : '';
+// node.usertags can be null → .in.map blows up
+```
+
+**Correct JS:**
+```js
+const usertags = node.usertags ? node.usertags.in.map(...).join(',') : '';
+```
+
+**Example:** `modules/instagram.js:777`
+
+**Search pattern:** `'[^']+' in [a-zA-Z_$][\w$]*\s*\?` — quoted-string `in`
+identifier followed by `?` (ternary). Quick check:
+`grep -nE "'[^']+' in [a-zA-Z_]+ \?" modules/`
+
+---
+
+### Datetime serialization format mismatch
+
+**Status:** open
+
+**Why it happens:** Python's `datetime.utcfromtimestamp(t).strftime('%Y-%m-%d %H:%M:%S')`
+produces `"2026-05-13 21:27:31"` — space-separated, no timezone marker. JS's
+`new Date(t * 1000).toISOString()` produces `"2026-05-13T21:27:31.000Z"` — T
+separator, milliseconds, Z. The generator emits the JS `.toISOString()` form
+instead of using the existing `formatUtcTimestamp` helper from lib.js that
+mimics Python's output exactly.
+
+**Wrong JS:**
+```js
+collected_at = new Date(node.taken_at * 1000).toISOString();
+```
+
+**Correct JS:**
+```js
+collected_at = formatUtcTimestamp(node.taken_at);
+// formatUtcTimestamp is defined in js/lib.js as:
+//   new Date(unixSeconds * 1000).toISOString().replace('T', ' ').slice(0, 19)
+```
+
+**Example:** `modules/instagram.js:782`
+
+**Search pattern:** `new Date\([^)]+\)\.toISOString\(\)` — any use of
+`.toISOString()`. The helper should be used instead. Quick check:
+`grep -nE "\.toISOString\(\)" modules/`
+
+---
+
+### `re.findall` capture groups vs JS `.match` with /g flag
+
+**Status:** open
+
+**Why it happens:** Python's `re.findall(r'#(\w+)', s)` returns the **capture
+group contents**: `['lotr', 'woodart']`. JS's `s.match(/#(\w+)/g)` (with the
+global flag) returns the **full matches**: `['#lotr', '#woodart']` — capture
+groups are ignored. The generator translates the regex literally without
+adjusting for this semantic difference, so the resulting strings keep
+prefixes/wrappers that Python would have stripped.
+
+**Wrong JS:**
+```js
+hashtags: caption.match(/#([^\s!@#$%^&*()_+{}:"|<>?;',./`~]+)/g)?.join(',')
+// produces "#lotr,#woodart"
+```
+
+**Correct JS:**
+```js
+// Option A: strip the literal prefix from each full match
+hashtags: caption.match(/#([^\s...]+)/g)?.map(h => h.slice(1)).join(',') ?? ''
+// Option B: use matchAll to get capture groups properly
+hashtags: [...caption.matchAll(/#([^\s...]+)/g)].map(m => m[1]).join(',') ?? ''
+```
+
+**Example:** `modules/instagram.js:812` (also 766, 870 — three copies)
+
+**Search pattern:** `\.match\(/[^/]*\([^/]*\)[^/]*/g\)` — any `.match()` with
+a global-flag regex containing a capture group. Quick check:
+`grep -nE "\.match\(/.*\(.*\).*\/g\)" modules/`
+
+---
+
+### `undefined` field values get dropped from JSON, but Python's `None` becomes `null`
+
+**Status:** open
+
+**Why it happens:** When `JSON.stringify` encounters an object property whose
+value is `undefined`, it **omits the key entirely** from the output. Python's
+`json.dumps` serializes `None` as `null`, keeping the key. The generator
+writes assignments like `location.city = node.location.city` where the
+right-hand side can be `undefined`, producing missing keys in JS output
+that show up as `only in Python: <field> = null` diffs against 4CAT.
+
+**Wrong JS:**
+```js
+location.city = node.location.city;  // undefined if .city missing
+// JSON.stringify({location_city: undefined}) → "{}" (key omitted)
+
+body: caption,  // null if no caption — Python returns "" here, not null
+```
+
+**Correct JS:**
+```js
+// Whichever fallback Python uses for that specific field:
+location.city = node.location.city ?? null;   // some fields → null
+body: caption ?? '',                          // other fields → ""
+```
+
+**Example:** `modules/instagram.js:745, 853` (`null` flavor),
+559, 648, 798 (`""` flavor for `body`)
+
+**Note:** Python's choice of `None` vs `""` is per-field — there's no
+universal rule. When the comparator reports `~ X  JS: null  Python: ""` use
+`?? ''`. When it reports `- only in Python: X = null` use `?? null`. The
+distinction matters because the JS output should match Python's choice
+exactly for that field.
+
+**Search pattern:** harder to grep automatically — any property assignment
+where the RHS could be `undefined`/`null` and the resulting field is
+expected to appear in the mapped output. Look at "only in Python: X = null"
+and "~ X  JS: null  Python: \"\"" diffs in the comparator output to find
+specific cases.
+
+---
+
+### Object-reference inequality used as type check
+
+**Status:** open
+
+**Why it happens:** The generator emits `caption !== new MissingMappedField('')`
+to mean "caption is not a missing-marker", but `new MissingMappedField('')`
+creates a fresh object every time, and `!==` on objects compares references.
+The expression is **always true**, so the conditional never takes the
+"missing" branch. Likely originates from Python idioms like `caption != ""`
+or `caption is not None`, mistranslated through the MissingMappedField
+abstraction.
+
+**Wrong JS:**
+```js
+hashtags: caption !== new MissingMappedField('') ? caption.match(...) : '',
+// !== between two different object references is always true
+```
+
+**Correct JS:**
+```js
+// If the intent was "if caption has content", just truthy-check it:
+hashtags: caption ? caption.match(...) : '',
+// If the intent was "if caption is not a MissingMappedField instance":
+hashtags: !(caption instanceof MissingMappedField) ? caption.match(...) : '',
+```
+
+**Example:** `modules/instagram.js:812` (and two other copies)
+
+**Search pattern:** `!== new [A-Z]` or `=== new [A-Z]` — any equality
+comparison with a freshly-constructed object. Quick check:
+`grep -nE "(!==|===) new [A-Z]" modules/`
+
+---
+
+### `.method()` chain on potentially-null result
+
+**Status:** open
+
+**Why it happens:** In Python, calling a method on `None` raises
+`AttributeError`, which 4CAT sometimes catches. In JS, calling a method on
+`null`/`undefined` throws `TypeError: Cannot read properties of null
+(reading '<method>')`. The generator emits the same dotted chain without
+optional-chaining (`?.`) protection.
+
+**Wrong JS:**
+```js
+hashtags: caption !== new MissingMappedField('')
+    ? caption.match(/#([^\s!@#$%^&*()_+{}:"|<>?;',./`~]+)/g)?.join(',')
+    : '',
+```
+(the `!== new ...` guard is always true and `caption` may be `null`, so
+`caption.match(...)` throws when the caption is null)
+
+**Correct JS:**
+```js
+hashtags: caption
+    ? caption.match(/#([^\s!@#$%^&*()_+{}:"|<>?;',./`~]+)/g)?.join(',') ?? ''
+    : '',
+```
+
+**Example:** `modules/instagram.js:809`
+
+**Search pattern:** harder to grep — needs reading. Worth manual review of
+any field that uses `caption.match`, `something.split`, `something.join`
+without `?.` on a value that could be null/undefined.
+
+---
+
+## Generator prompt feedback (running list)
+
+Concrete things to fold into the generator's prompt over time:
+
+1. **Python `x in y` where `y` is a string** → use `y.includes(x)` in JS,
+   never `x in y`.
+2. **Python f-strings** → use JS template literals (backticks) with
+   `${...}` syntax. Never leave `{...}` in single- or double-quoted strings.
+3. **`?? {}` after a `.get(...) or {}` translation** → only use this if the
+   following code does property access. For a truthy guard (`if (x && y)`),
+   drop the default and use just `node.user` — JS `{}` is truthy, Python `{}` is not.
+4. **Method chains on possibly-null values** → use `?.` (optional
+   chaining) instead of `.` whenever the receiver could be null/undefined.
+5. **The auto-imports header block** → emit either real `import { ... }`
+   statements with valid relative paths, or a comment-only header.
+   Never emit bare paths as JS statements.
+6. **Python `node.get('X')` truthy check** → in JS, use `node.X` (or
+   `node.X != null`, which also accepts `0`/`''`), not `'X' in node`. The `in`
+   operator checks key existence, which is `true` even for explicit-null values.
+7. **Datetime serialization** → use the `formatUtcTimestamp` helper from
+   lib.js (which mimics Python's `strftime('%Y-%m-%d %H:%M:%S')` format),
+   not `new Date(...).toISOString()` (which has a different output shape:
+   T separator, milliseconds, Z suffix).
+8. **`re.findall` with capture groups** → in JS, `.match(/.../g)` returns
+   full matches, NOT capture groups. To get capture-group behavior, use
+   either `[...s.matchAll(/.../g)].map(m => m[1])` or post-process the
+   full matches with `.map(...)` to strip the literal parts.
+9. **Object-reference equality (`!== new X(...)`)** → never. Creating an
+   object with `new` produces a fresh reference; `===`/`!==` compares
+   identity. Use `instanceof X` for type checks, or compare values directly.
+   The "is this missing?" check is `caption instanceof MissingMappedField`;
+   truthy-check the value only to mean "has content" (an instance is truthy).
+10. **Python `None` → JSON `null` vs JS `undefined` → omitted** — when a
+    field's value could be missing and Python returns `null` for it,
+    JS must explicitly assign `null` (not leave the value as `undefined`).
+    `JSON.stringify` drops `undefined` keys silently. Use `value ?? null`
+    when the field is expected to appear in the mapped output.
diff --git a/tests/zeeschuimer-to-4cat.json b/tests/zeeschuimer-to-4cat.json
new file mode 100644
index 0000000..f7de942
--- /dev/null
+++ b/tests/zeeschuimer-to-4cat.json
@@ -0,0 +1,7 @@
+{
+  "_comment": "Maps Zeeschuimer module filenames (without .js) to 4CAT datasource ids when they differ. Default behavior is identity — only include entries where the two diverge. Discovered via http://localhost/api/datasources/.",
+  "9gag": "ninegag",
+  "truth": "truthsocial",
+  "rednote": "xiaohongshu",
+  "rednote-comments": "xiaohongshu-comments"
+}