feat(tagging+archetypes): add Pillowfort/Politics/Midrange/Toolbox tagging and unify archetype presence skip logic

This commit is contained in:
matt 2025-09-19 11:53:52 -07:00
parent f2a76d2ffc
commit 6d6243d6be
47 changed files with 21133 additions and 839 deletions

View file

@ -0,0 +1,33 @@
import json
import os
from pathlib import Path
ROOT = Path(__file__).resolve().parents[2]
SCRIPT = ROOT / 'code' / 'scripts' / 'build_theme_catalog.py'
OUTPUT = ROOT / 'config' / 'themes' / 'theme_list_test_regression.json'
def test_generic_description_regression():
# Run build with summary enabled directed to temp output
env = os.environ.copy()
env['EDITORIAL_INCLUDE_FALLBACK_SUMMARY'] = '1'
# Avoid writing real catalog file; just produce alternate output
import subprocess
import sys
cmd = [sys.executable, str(SCRIPT), '--output', str(OUTPUT)]
res = subprocess.run(cmd, capture_output=True, text=True, env=env)
assert res.returncode == 0, res.stderr
data = json.loads(OUTPUT.read_text(encoding='utf-8'))
summary = data.get('description_fallback_summary') or {}
# Guardrails tightened (second wave). Prior baseline: ~357 generic (309 + 48).
# New ceiling: <= 365 total generic and <52% share. Future passes should lower further.
assert summary.get('generic_total', 0) <= 365, summary
assert summary.get('generic_pct', 100.0) < 52.0, summary
# Basic shape checks
assert 'top_generic_by_frequency' in summary
assert isinstance(summary['top_generic_by_frequency'], list)
# Clean up temp output file
try:
OUTPUT.unlink()
except Exception:
pass