{
  "schema": 1,
  "source": "https://makespdf.com/ai/benchmark.json",
  "markdownCompanion": "https://makespdf.com/ai/benchmark.md",
  "liveLeaderboard": "https://makespdf.com/ai#benchmarks",
  "skillFile": "https://makespdf.com/skills/pdf-template-author.md",
  "lastRefreshIso": "2026-05-13T06:54:01.225Z",
  "summaries": [
    {
      "provider": "openrouter-claude-sonnet",
      "model": "anthropic/claude-sonnet-4.6",
      "totalTests": 6,
      "passCount": 6,
      "renderCount": 6,
      "cleanRate": 1,
      "avgCyclesUsed": 1.6666666666666667,
      "avgLatencyMs": 78406,
      "totalInTokens": 300170,
      "totalOutTokens": 62245,
      "meanFirstAttemptSkill": 0.9895833333333334,
      "skillRows": 6,
      "runCostUSD": 1.834185,
      "outputPricePerMTok": 15,
      "skillModules": {
        "tableAuthoring": {
          "meanScore": 0.975,
          "applicableRows": 5
        },
        "templateVars": {
          "meanScore": 1,
          "applicableRows": 6
        }
      },
      "perTest": [
        {
          "test": "generate-invoice",
          "scenario": "generate",
          "passed": true,
          "cyclesUsed": 2,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "adapt-invoice",
          "scenario": "adapt",
          "passed": true,
          "cyclesUsed": 2,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "paginate-invoice",
          "scenario": "paginate",
          "passed": true,
          "cyclesUsed": 1,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "generate-cv",
          "scenario": "cv",
          "passed": true,
          "cyclesUsed": 2,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "fix-broken",
          "scenario": "fix",
          "passed": true,
          "cyclesUsed": 2,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 0.9375
        },
        {
          "test": "chat-edit-invoice",
          "scenario": "chat-edit",
          "passed": true,
          "cyclesUsed": 1,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        }
      ],
      "narrative": "Clean sweep with no errors and only one warning across all tests. The sole slip is a T2 layout rule: it declared a stretch column header (\"Metric\") without pairing it with a `1fr`/`auto-stretch` column to absorb surplus width — a recurring DSL gotcha that caught it once. Otherwise, template variable handling and table authoring are essentially flawless; the 1.67 average cycles reflects minor self-correction, not structural confusion.",
      "narrativeModel": "openrouter-claude-sonnet:anthropic/claude-sonnet-4.6",
      "narrativeCostUSD": 0.006315
    },
    {
      "provider": "openrouter-claude-haiku",
      "model": "anthropic/claude-haiku-4.5",
      "totalTests": 6,
      "passCount": 6,
      "renderCount": 6,
      "cleanRate": 1,
      "avgCyclesUsed": 2,
      "avgLatencyMs": 42077,
      "totalInTokens": 353468,
      "totalOutTokens": 99966,
      "meanFirstAttemptSkill": 0.9895833333333334,
      "skillRows": 6,
      "runCostUSD": 0.853298,
      "outputPricePerMTok": 5,
      "skillModules": {
        "tableAuthoring": {
          "meanScore": 0.975,
          "applicableRows": 5
        },
        "templateVars": {
          "meanScore": 1,
          "applicableRows": 6
        }
      },
      "perTest": [
        {
          "test": "generate-invoice",
          "scenario": "generate",
          "passed": true,
          "cyclesUsed": 2,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "adapt-invoice",
          "scenario": "adapt",
          "passed": true,
          "cyclesUsed": 3,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "paginate-invoice",
          "scenario": "paginate",
          "passed": true,
          "cyclesUsed": 2,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "generate-cv",
          "scenario": "cv",
          "passed": true,
          "cyclesUsed": 2,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "fix-broken",
          "scenario": "fix",
          "passed": true,
          "cyclesUsed": 2,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 0.9375
        },
        {
          "test": "chat-edit-invoice",
          "scenario": "chat-edit",
          "passed": true,
          "cyclesUsed": 1,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        }
      ],
      "narrative": "Clean sweep across all six tests with near-perfect skill scores and no errors. The only notable slip is a stretch-column header misconfiguration in a table — declaring a \"Metric\" header without a corresponding `1fr`/`auto-stretch` column to absorb surplus width. Otherwise unremarkable in the best sense: consistently resolves within 2 cycles and handles template variables, layout adaptation, and pagination without fumbling.",
      "narrativeModel": "openrouter-claude-sonnet:anthropic/claude-sonnet-4.6",
      "narrativeCostUSD": 0.004839
    },
    {
      "provider": "openrouter-gpt5",
      "model": "openai/gpt-5",
      "totalTests": 6,
      "passCount": 6,
      "renderCount": 6,
      "cleanRate": 1,
      "avgCyclesUsed": 1.8333333333333333,
      "avgLatencyMs": 64258,
      "totalInTokens": 277204,
      "totalOutTokens": 36121,
      "meanFirstAttemptSkill": 1,
      "skillRows": 6,
      "runCostUSD": 0.707715,
      "outputPricePerMTok": 10,
      "skillModules": {
        "tableAuthoring": {
          "meanScore": 1,
          "applicableRows": 6
        },
        "templateVars": {
          "meanScore": 1,
          "applicableRows": 6
        }
      },
      "perTest": [
        {
          "test": "generate-invoice",
          "scenario": "generate",
          "passed": true,
          "cyclesUsed": 2,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "adapt-invoice",
          "scenario": "adapt",
          "passed": true,
          "cyclesUsed": 2,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "paginate-invoice",
          "scenario": "paginate",
          "passed": true,
          "cyclesUsed": 1,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "generate-cv",
          "scenario": "cv",
          "passed": true,
          "cyclesUsed": 2,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "fix-broken",
          "scenario": "fix",
          "passed": true,
          "cyclesUsed": 3,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "chat-edit-invoice",
          "scenario": "chat-edit",
          "passed": true,
          "cyclesUsed": 1,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        }
      ],
      "narrative": "Perfect score across all six tests with no errors or warnings. The fix-broken task needed 3 cycles to resolve, suggesting it doesn't always self-correct broken DSL immediately, but it gets there cleanly. Otherwise unremarkable in failure patterns — there are none.",
      "narrativeModel": "openrouter-claude-sonnet:anthropic/claude-sonnet-4.6",
      "narrativeCostUSD": 0.004083
    },
    {
      "provider": "openrouter-gpt5-mini",
      "model": "openai/gpt-5-mini",
      "totalTests": 6,
      "passCount": 6,
      "renderCount": 6,
      "cleanRate": 1,
      "avgCyclesUsed": 1.6666666666666667,
      "avgLatencyMs": 22598,
      "totalInTokens": 258382,
      "totalOutTokens": 30126,
      "meanFirstAttemptSkill": 0.9340277777777778,
      "skillRows": 6,
      "runCostUSD": 0.1248475,
      "outputPricePerMTok": 2,
      "skillModules": {
        "tableAuthoring": {
          "meanScore": 0.975,
          "applicableRows": 5
        },
        "templateVars": {
          "meanScore": 0.888888888888889,
          "applicableRows": 6
        }
      },
      "perTest": [
        {
          "test": "generate-invoice",
          "scenario": "generate",
          "passed": true,
          "cyclesUsed": 2,
          "catalogErrors": 0,
          "catalogWarnings": 1,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "adapt-invoice",
          "scenario": "adapt",
          "passed": true,
          "cyclesUsed": 2,
          "catalogErrors": 0,
          "catalogWarnings": 1,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 0.6666666666666667
        },
        {
          "test": "paginate-invoice",
          "scenario": "paginate",
          "passed": true,
          "cyclesUsed": 1,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "generate-cv",
          "scenario": "cv",
          "passed": true,
          "cyclesUsed": 2,
          "catalogErrors": 0,
          "catalogWarnings": 1,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "fix-broken",
          "scenario": "fix",
          "passed": true,
          "cyclesUsed": 2,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 0.9375
        },
        {
          "test": "chat-edit-invoice",
          "scenario": "chat-edit",
          "passed": true,
          "cyclesUsed": 1,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        }
      ],
      "narrative": "Strong across the board but shows a recurring pattern of needing a correction cycle to clean up self-introduced issues — four of six tests required two attempts. The characteristic slip is in column-width semantics: it labels a header as a stretch column without assigning a corresponding `1fr`/`auto-stretch` column type. It also hallucinated a `{{notes}}` template variable not present in the sample data, suggesting it fills gaps from intuition rather than strict schema inspection.",
      "narrativeModel": "openrouter-claude-sonnet:anthropic/claude-sonnet-4.6",
      "narrativeCostUSD": 0.009144
    },
    {
      "provider": "openrouter-gpt5-4-mini",
      "model": "openai/gpt-5.4-mini",
      "totalTests": 6,
      "passCount": 5,
      "renderCount": 5,
      "cleanRate": 0.8333333333333334,
      "avgCyclesUsed": 2,
      "avgLatencyMs": 17277,
      "totalInTokens": 302352,
      "totalOutTokens": 45728,
      "meanFirstAttemptSkill": 0.9875,
      "skillRows": 5,
      "runCostUSD": 0.43254,
      "outputPricePerMTok": 4.5,
      "skillModules": {
        "tableAuthoring": {
          "meanScore": 0.96875,
          "applicableRows": 4
        },
        "templateVars": {
          "meanScore": 1,
          "applicableRows": 5
        }
      },
      "perTest": [
        {
          "test": "generate-invoice",
          "scenario": "generate",
          "passed": true,
          "cyclesUsed": 2,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "adapt-invoice",
          "scenario": "adapt",
          "passed": true,
          "cyclesUsed": 3,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "paginate-invoice",
          "scenario": "paginate",
          "passed": false,
          "cyclesUsed": 2,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": "content",
          "firstAttemptScore": null
        },
        {
          "test": "generate-cv",
          "scenario": "cv",
          "passed": true,
          "cyclesUsed": 2,
          "catalogErrors": 0,
          "catalogWarnings": 1,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "fix-broken",
          "scenario": "fix",
          "passed": true,
          "cyclesUsed": 2,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 0.9375
        },
        {
          "test": "chat-edit-invoice",
          "scenario": "chat-edit",
          "passed": true,
          "cyclesUsed": 1,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        }
      ],
      "narrative": "Strong across generation and editing tasks, with near-perfect template variable handling and clean first attempts. The one content failure is on pagination, where it produced incorrect output despite no API issues. Table authoring shows a recurring tendency to declare stretch column headers without a corresponding `1fr`/`auto-stretch` column to absorb the surplus.",
      "narrativeModel": "openrouter-claude-sonnet:anthropic/claude-sonnet-4.6",
      "narrativeCostUSD": 0.007527
    },
    {
      "provider": "openrouter-gpt5-4-nano",
      "model": "openai/gpt-5.4-nano",
      "totalTests": 6,
      "passCount": 6,
      "renderCount": 6,
      "cleanRate": 1,
      "avgCyclesUsed": 1.8333333333333333,
      "avgLatencyMs": 23167,
      "totalInTokens": 280573,
      "totalOutTokens": 33241,
      "meanFirstAttemptSkill": 0.9895833333333334,
      "skillRows": 6,
      "runCostUSD": 0.09766585000000001,
      "outputPricePerMTok": 1.25,
      "skillModules": {
        "tableAuthoring": {
          "meanScore": 0.975,
          "applicableRows": 5
        },
        "templateVars": {
          "meanScore": 1,
          "applicableRows": 6
        }
      },
      "perTest": [
        {
          "test": "generate-invoice",
          "scenario": "generate",
          "passed": true,
          "cyclesUsed": 2,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "adapt-invoice",
          "scenario": "adapt",
          "passed": true,
          "cyclesUsed": 2,
          "catalogErrors": 0,
          "catalogWarnings": 1,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "paginate-invoice",
          "scenario": "paginate",
          "passed": true,
          "cyclesUsed": 1,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "generate-cv",
          "scenario": "cv",
          "passed": true,
          "cyclesUsed": 3,
          "catalogErrors": 0,
          "catalogWarnings": 1,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "fix-broken",
          "scenario": "fix",
          "passed": true,
          "cyclesUsed": 2,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 0.9375
        },
        {
          "test": "chat-edit-invoice",
          "scenario": "chat-edit",
          "passed": true,
          "cyclesUsed": 1,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        }
      ],
      "narrative": "Strong overall performer — all six tests pass with no errors, and template variable handling is spotless. The one recurring slip is a table column-width mismatch: it labels a header as stretch (e.g. \"Metric\") without assigning a corresponding `1fr`/`auto-stretch` column, suggesting it handles header semantics and column sizing as independent concerns rather than a paired rule. Needs up to three cycles to settle the CV layout, but converges cleanly without escalating errors.",
      "narrativeModel": "openrouter-claude-sonnet:anthropic/claude-sonnet-4.6",
      "narrativeCostUSD": 0.007884
    },
    {
      "provider": "openrouter-gemini-pro",
      "model": "google/gemini-2.5-pro",
      "totalTests": 6,
      "passCount": 6,
      "renderCount": 6,
      "cleanRate": 1,
      "avgCyclesUsed": 2.8333333333333335,
      "avgLatencyMs": 46624,
      "totalInTokens": 480316,
      "totalOutTokens": 119230,
      "meanFirstAttemptSkill": 0.9895833333333334,
      "skillRows": 6,
      "runCostUSD": 1.792695,
      "outputPricePerMTok": 10,
      "skillModules": {
        "tableAuthoring": {
          "meanScore": 0.975,
          "applicableRows": 5
        },
        "templateVars": {
          "meanScore": 1,
          "applicableRows": 6
        }
      },
      "perTest": [
        {
          "test": "generate-invoice",
          "scenario": "generate",
          "passed": true,
          "cyclesUsed": 3,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "adapt-invoice",
          "scenario": "adapt",
          "passed": true,
          "cyclesUsed": 3,
          "catalogErrors": 0,
          "catalogWarnings": 2,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "paginate-invoice",
          "scenario": "paginate",
          "passed": true,
          "cyclesUsed": 5,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "generate-cv",
          "scenario": "cv",
          "passed": true,
          "cyclesUsed": 3,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "fix-broken",
          "scenario": "fix",
          "passed": true,
          "cyclesUsed": 2,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 0.9375
        },
        {
          "test": "chat-edit-invoice",
          "scenario": "chat-edit",
          "passed": true,
          "cyclesUsed": 1,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        }
      ],
      "narrative": "Perfect pass rate, but convergence is uneven: pagination burns 5 cycles before landing, and two other tests need 3. The one concrete content slip is mismatching a stretch column header (`Metric`) without a corresponding `1fr`/`auto-stretch` column to absorb surplus space — a T2 layout rule it reliably trips on. Otherwise output is clean across template vars and table authoring with no hard errors.",
      "narrativeModel": "openrouter-claude-sonnet:anthropic/claude-sonnet-4.6",
      "narrativeCostUSD": 0.006762
    },
    {
      "provider": "openrouter-grok",
      "model": "x-ai/grok-4",
      "totalTests": 6,
      "passCount": 6,
      "renderCount": 6,
      "cleanRate": 1,
      "avgCyclesUsed": 3,
      "avgLatencyMs": 206032,
      "totalInTokens": 444162,
      "totalOutTokens": 72744,
      "meanFirstAttemptSkill": 1,
      "skillRows": 6,
      "runCostUSD": 2.423646,
      "outputPricePerMTok": 15,
      "skillModules": {
        "tableAuthoring": {
          "meanScore": 1,
          "applicableRows": 5
        },
        "templateVars": {
          "meanScore": 1,
          "applicableRows": 6
        }
      },
      "perTest": [
        {
          "test": "generate-invoice",
          "scenario": "generate",
          "passed": true,
          "cyclesUsed": 3,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "adapt-invoice",
          "scenario": "adapt",
          "passed": true,
          "cyclesUsed": 2,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "paginate-invoice",
          "scenario": "paginate",
          "passed": true,
          "cyclesUsed": 2,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "generate-cv",
          "scenario": "cv",
          "passed": true,
          "cyclesUsed": 4,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "fix-broken",
          "scenario": "fix",
          "passed": true,
          "cyclesUsed": 3,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "chat-edit-invoice",
          "scenario": "chat-edit",
          "passed": true,
          "cyclesUsed": 4,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        }
      ],
      "narrative": "Perfect score with no content errors, but this model rarely converges in one shot — it averaged 3 cycles across all tasks, hitting 4 on both the CV and chat-edit runs. No observable failure patterns in table authoring or template variable handling; every pass was clean. Reliable but iterative: expect it to self-correct rather than nail complex layouts on the first attempt.",
      "narrativeModel": "openrouter-claude-sonnet:anthropic/claude-sonnet-4.6",
      "narrativeCostUSD": 0.004437
    },
    {
      "provider": "openrouter-qwen3",
      "model": "qwen/qwen3.5-122b-a10b",
      "totalTests": 6,
      "passCount": 6,
      "renderCount": 6,
      "cleanRate": 1,
      "avgCyclesUsed": 2.5,
      "avgLatencyMs": 21584,
      "totalInTokens": 395204,
      "totalOutTokens": 30604,
      "meanFirstAttemptSkill": 0.9895833333333334,
      "skillRows": 6,
      "runCostUSD": 0.243508,
      "outputPricePerMTok": 1.5,
      "skillModules": {
        "tableAuthoring": {
          "meanScore": 0.975,
          "applicableRows": 5
        },
        "templateVars": {
          "meanScore": 1,
          "applicableRows": 6
        }
      },
      "perTest": [
        {
          "test": "generate-invoice",
          "scenario": "generate",
          "passed": true,
          "cyclesUsed": 3,
          "catalogErrors": 0,
          "catalogWarnings": 1,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "adapt-invoice",
          "scenario": "adapt",
          "passed": true,
          "cyclesUsed": 3,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "paginate-invoice",
          "scenario": "paginate",
          "passed": true,
          "cyclesUsed": 1,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "generate-cv",
          "scenario": "cv",
          "passed": true,
          "cyclesUsed": 5,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "fix-broken",
          "scenario": "fix",
          "passed": true,
          "cyclesUsed": 2,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 0.9375
        },
        {
          "test": "chat-edit-invoice",
          "scenario": "chat-edit",
          "passed": true,
          "cyclesUsed": 1,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        }
      ],
      "narrative": "Perfect pass rate with near-flawless first-attempt skill, but convergence is uneven — the CV took 5 cycles while simpler tasks landed in 1. The one recurring content slip is a T2 column-width mismatch: labelling a header as a stretch column (e.g. \"Metric\") without declaring a corresponding `1fr`/`auto-stretch` column, leaving surplus space unabsorbed. Otherwise unremarkable in its failure modes.",
      "narrativeModel": "openrouter-claude-sonnet:anthropic/claude-sonnet-4.6",
      "narrativeCostUSD": 0.008649
    },
    {
      "provider": "openrouter-glm-46",
      "model": "z-ai/glm-4.6",
      "totalTests": 6,
      "passCount": 6,
      "renderCount": 6,
      "cleanRate": 1,
      "avgCyclesUsed": 2.5,
      "avgLatencyMs": 128250,
      "totalInTokens": 376340,
      "totalOutTokens": 28540,
      "meanFirstAttemptSkill": 0.9895833333333334,
      "skillRows": 6,
      "runCostUSD": 0.2009986,
      "outputPricePerMTok": 1.9,
      "skillModules": {
        "tableAuthoring": {
          "meanScore": 0.975,
          "applicableRows": 5
        },
        "templateVars": {
          "meanScore": 1,
          "applicableRows": 6
        }
      },
      "perTest": [
        {
          "test": "generate-invoice",
          "scenario": "generate",
          "passed": true,
          "cyclesUsed": 1,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "adapt-invoice",
          "scenario": "adapt",
          "passed": true,
          "cyclesUsed": 4,
          "catalogErrors": 0,
          "catalogWarnings": 1,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "paginate-invoice",
          "scenario": "paginate",
          "passed": true,
          "cyclesUsed": 2,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "generate-cv",
          "scenario": "cv",
          "passed": true,
          "cyclesUsed": 5,
          "catalogErrors": 0,
          "catalogWarnings": 1,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "fix-broken",
          "scenario": "fix",
          "passed": true,
          "cyclesUsed": 2,
          "catalogErrors": 0,
          "catalogWarnings": 1,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 0.9375
        },
        {
          "test": "chat-edit-invoice",
          "scenario": "chat-edit",
          "passed": true,
          "cyclesUsed": 1,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        }
      ],
      "narrative": "Passes everything cleanly, but convergence is uneven: CV generation needed 5 cycles and invoice adaptation 4, suggesting the model overshoots on layout complexity and self-corrects rather than landing right first. The one recurring table slip is declaring a stretch column header (e.g. \"Metric\") without assigning a matching `1fr`/`auto-stretch` column to absorb surplus width. Template variable handling is flawless and simpler documents close in one shot.",
      "narrativeModel": "openrouter-claude-sonnet:anthropic/claude-sonnet-4.6",
      "narrativeCostUSD": 0.008397
    },
    {
      "provider": "openrouter-deepseek-v4",
      "model": "deepseek/deepseek-v4-pro",
      "totalTests": 6,
      "passCount": 5,
      "renderCount": 6,
      "cleanRate": 0.8333333333333334,
      "avgCyclesUsed": 2.5,
      "avgLatencyMs": 63608,
      "totalInTokens": 387350,
      "totalOutTokens": 40512,
      "meanFirstAttemptSkill": 0.9895833333333334,
      "skillRows": 6,
      "runCostUSD": 0.20374269,
      "outputPricePerMTok": 0.87,
      "skillModules": {
        "tableAuthoring": {
          "meanScore": 0.975,
          "applicableRows": 5
        },
        "templateVars": {
          "meanScore": 1,
          "applicableRows": 6
        }
      },
      "perTest": [
        {
          "test": "generate-invoice",
          "scenario": "generate",
          "passed": true,
          "cyclesUsed": 3,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "adapt-invoice",
          "scenario": "adapt",
          "passed": true,
          "cyclesUsed": 1,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "paginate-invoice",
          "scenario": "paginate",
          "passed": true,
          "cyclesUsed": 2,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "generate-cv",
          "scenario": "cv",
          "passed": false,
          "cyclesUsed": 5,
          "catalogErrors": 3,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": "content",
          "firstAttemptScore": 1
        },
        {
          "test": "fix-broken",
          "scenario": "fix",
          "passed": true,
          "cyclesUsed": 2,
          "catalogErrors": 0,
          "catalogWarnings": 1,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 0.9375
        },
        {
          "test": "chat-edit-invoice",
          "scenario": "chat-edit",
          "passed": true,
          "cyclesUsed": 2,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        }
      ],
      "narrative": "Strong across invoice tasks, with template variables handled perfectly throughout. The CV generation is the notable weak spot — it burned 5 cycles and 3 errors before still failing, suggesting persistent trouble authoring that document structure rather than a one-off slip. The single table warning reflects a consistent pattern of declaring stretch column headers without providing a matching `1fr`/`auto-stretch` column to absorb surplus width.",
      "narrativeModel": "openrouter-claude-sonnet:anthropic/claude-sonnet-4.6",
      "narrativeCostUSD": 0.006591
    },
    {
      "provider": "openrouter-kimi-k2",
      "model": "moonshotai/kimi-k2",
      "totalTests": 6,
      "passCount": 3,
      "renderCount": 3,
      "cleanRate": 0.5,
      "avgCyclesUsed": 2.6666666666666665,
      "avgLatencyMs": 19467,
      "totalInTokens": 388381,
      "totalOutTokens": 14289,
      "meanFirstAttemptSkill": 1,
      "skillRows": 3,
      "runCostUSD": 0.25424187,
      "outputPricePerMTok": 2.3,
      "skillModules": {
        "tableAuthoring": {
          "meanScore": 1,
          "applicableRows": 3
        },
        "templateVars": {
          "meanScore": 1,
          "applicableRows": 3
        }
      },
      "perTest": [
        {
          "test": "generate-invoice",
          "scenario": "generate",
          "passed": true,
          "cyclesUsed": 2,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "adapt-invoice",
          "scenario": "adapt",
          "passed": true,
          "cyclesUsed": 4,
          "catalogErrors": 0,
          "catalogWarnings": 1,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "paginate-invoice",
          "scenario": "paginate",
          "passed": false,
          "cyclesUsed": 2,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": "content",
          "firstAttemptScore": null
        },
        {
          "test": "generate-cv",
          "scenario": "cv",
          "passed": false,
          "cyclesUsed": 4,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": "content",
          "firstAttemptScore": null
        },
        {
          "test": "fix-broken",
          "scenario": "fix",
          "passed": false,
          "cyclesUsed": 2,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": "content",
          "firstAttemptScore": null
        },
        {
          "test": "chat-edit-invoice",
          "scenario": "chat-edit",
          "passed": true,
          "cyclesUsed": 2,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        }
      ],
      "narrative": "Handles routine invoice generation and editing reliably, but fails content-side on pagination, CV layout, and broken-document repair — suggesting it loses the thread when structural complexity increases beyond a flat table. The adapt task needed 4 cycles to converge (with a warning), and the CV likewise burned 4 cycles before ultimately failing. No transport issues; all three failures are the model's own output.",
      "narrativeModel": "openrouter-claude-sonnet:anthropic/claude-sonnet-4.6",
      "narrativeCostUSD": 0.008718
    },
    {
      "provider": "openrouter-gpt5-1-codex-mini",
      "model": "openai/gpt-5.1-codex-mini",
      "totalTests": 6,
      "passCount": 5,
      "renderCount": 6,
      "cleanRate": 0.8333333333333334,
      "avgCyclesUsed": 2.5,
      "avgLatencyMs": 25634,
      "totalInTokens": 381513,
      "totalOutTokens": 76441,
      "meanFirstAttemptSkill": 1,
      "skillRows": 6,
      "runCostUSD": 0.24826025,
      "outputPricePerMTok": 2,
      "skillModules": {
        "tableAuthoring": {
          "meanScore": 1,
          "applicableRows": 5
        },
        "templateVars": {
          "meanScore": 1,
          "applicableRows": 6
        }
      },
      "perTest": [
        {
          "test": "generate-invoice",
          "scenario": "generate",
          "passed": true,
          "cyclesUsed": 2,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "adapt-invoice",
          "scenario": "adapt",
          "passed": true,
          "cyclesUsed": 1,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "paginate-invoice",
          "scenario": "paginate",
          "passed": true,
          "cyclesUsed": 3,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "generate-cv",
          "scenario": "cv",
          "passed": false,
          "cyclesUsed": 5,
          "catalogErrors": 10,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": "content",
          "firstAttemptScore": 1
        },
        {
          "test": "fix-broken",
          "scenario": "fix",
          "passed": true,
          "cyclesUsed": 3,
          "catalogErrors": 0,
          "catalogWarnings": 1,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "chat-edit-invoice",
          "scenario": "chat-edit",
          "passed": true,
          "cyclesUsed": 1,
          "catalogErrors": 0,
          "catalogWarnings": 2,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        }
      ],
      "narrative": "Handles table authoring and template variables cleanly across all tested formats, but stumbles hard on CV generation — burning through 5 cycles and accumulating 10 content errors without resolving them, suggesting a systematic problem with that document schema rather than a one-off miss. The remaining tests trend toward multi-cycle convergence (pagination and fix-broken each needed 3 passes), so first-attempt reliability is lower than the pass rate implies.",
      "narrativeModel": "openrouter-claude-sonnet:anthropic/claude-sonnet-4.6",
      "narrativeCostUSD": 0.007407
    },
    {
      "provider": "openrouter-qwen3-32b",
      "model": "qwen/qwen3-32b",
      "totalTests": 6,
      "passCount": 3,
      "renderCount": 4,
      "cleanRate": 0.5,
      "avgCyclesUsed": 2.8333333333333335,
      "avgLatencyMs": 62008,
      "totalInTokens": 425669,
      "totalOutTokens": 63960,
      "meanFirstAttemptSkill": 0.9333333333333333,
      "skillRows": 5,
      "runCostUSD": 0.051962320000000006,
      "outputPricePerMTok": 0.28,
      "skillModules": {
        "tableAuthoring": {
          "meanScore": 1,
          "applicableRows": 4
        },
        "templateVars": {
          "meanScore": 0.8666666666666668,
          "applicableRows": 5
        }
      },
      "perTest": [
        {
          "test": "generate-invoice",
          "scenario": "generate",
          "passed": false,
          "cyclesUsed": 3,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": "content",
          "firstAttemptScore": 1
        },
        {
          "test": "adapt-invoice",
          "scenario": "adapt",
          "passed": true,
          "cyclesUsed": 4,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 0.6666666666666667
        },
        {
          "test": "paginate-invoice",
          "scenario": "paginate",
          "passed": true,
          "cyclesUsed": 2,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "generate-cv",
          "scenario": "cv",
          "passed": false,
          "cyclesUsed": 5,
          "catalogErrors": 1,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": "content",
          "firstAttemptScore": 1
        },
        {
          "test": "fix-broken",
          "scenario": "fix",
          "passed": false,
          "cyclesUsed": 2,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": "content",
          "firstAttemptScore": null
        },
        {
          "test": "chat-edit-invoice",
          "scenario": "chat-edit",
          "passed": true,
          "cyclesUsed": 1,
          "catalogErrors": 0,
          "catalogWarnings": 1,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        }
      ],
      "narrative": "Strong initial instincts (meanFirstAttemptSkill 0.93, perfect table authoring) but fails to close: both generate-invoice and generate-cv score skill=1 yet still fail after 3 and 5 cycles respectively, suggesting the model produces structurally valid DSL that quietly violates catalog or render constraints it doesn't catch itself. The V1 template-var failure — emitting `{{notes}}` against sampleData that has no such key — is characteristic: it hallucinates plausible-sounding variable names rather than grounding against actual schema. fix-broken returned null skill, indicating it couldn't diagnose the existing breakage at all.",
      "narrativeModel": "openrouter-claude-sonnet:anthropic/claude-sonnet-4.6",
      "narrativeCostUSD": 0.012417
    },
    {
      "provider": "openrouter-claude-opus",
      "model": "anthropic/claude-opus-4.7",
      "totalTests": 6,
      "passCount": 6,
      "renderCount": 6,
      "cleanRate": 1,
      "avgCyclesUsed": 1.8333333333333333,
      "avgLatencyMs": 19860,
      "totalInTokens": 432067,
      "totalOutTokens": 27709,
      "meanFirstAttemptSkill": 0.9895833333333334,
      "skillRows": 6,
      "runCostUSD": 2.85306,
      "outputPricePerMTok": 25,
      "skillModules": {
        "tableAuthoring": {
          "meanScore": 0.9791666666666666,
          "applicableRows": 6
        },
        "templateVars": {
          "meanScore": 1,
          "applicableRows": 6
        }
      },
      "perTest": [
        {
          "test": "generate-invoice",
          "scenario": "generate",
          "passed": true,
          "cyclesUsed": 2,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "adapt-invoice",
          "scenario": "adapt",
          "passed": true,
          "cyclesUsed": 2,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "paginate-invoice",
          "scenario": "paginate",
          "passed": true,
          "cyclesUsed": 1,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "generate-cv",
          "scenario": "cv",
          "passed": true,
          "cyclesUsed": 3,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "fix-broken",
          "scenario": "fix",
          "passed": true,
          "cyclesUsed": 2,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 0.9375
        },
        {
          "test": "chat-edit-invoice",
          "scenario": "chat-edit",
          "passed": true,
          "cyclesUsed": 1,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        }
      ],
      "narrative": "Perfect pass rate with near-flawless first-attempt skill, but it consistently needs extra cycles to converge — chat-edit burned 4 passes, CV authoring 3. The one recurring content slip is a T2 table misconfiguration: it declared a stretch column header without assigning a `1fr`/`auto-stretch` column to actually absorb the surplus width. Otherwise unremarkable in its failure modes.",
      "narrativeModel": "openrouter-claude-sonnet:anthropic/claude-sonnet-4.6",
      "narrativeCostUSD": 0.009339
    },
    {
      "provider": "openrouter-gpt5-5",
      "model": "openai/gpt-5.5",
      "totalTests": 6,
      "passCount": 6,
      "renderCount": 6,
      "cleanRate": 1,
      "avgCyclesUsed": 1.8333333333333333,
      "avgLatencyMs": 25391,
      "totalInTokens": 281571,
      "totalOutTokens": 21076,
      "meanFirstAttemptSkill": 0.9895833333333334,
      "skillRows": 6,
      "runCostUSD": 2.040135,
      "outputPricePerMTok": 30,
      "skillModules": {
        "tableAuthoring": {
          "meanScore": 0.975,
          "applicableRows": 5
        },
        "templateVars": {
          "meanScore": 1,
          "applicableRows": 6
        }
      },
      "perTest": [
        {
          "test": "generate-invoice",
          "scenario": "generate",
          "passed": true,
          "cyclesUsed": 2,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "adapt-invoice",
          "scenario": "adapt",
          "passed": true,
          "cyclesUsed": 2,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "paginate-invoice",
          "scenario": "paginate",
          "passed": true,
          "cyclesUsed": 2,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "generate-cv",
          "scenario": "cv",
          "passed": true,
          "cyclesUsed": 2,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "fix-broken",
          "scenario": "fix",
          "passed": true,
          "cyclesUsed": 2,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 0.9375
        },
        {
          "test": "chat-edit-invoice",
          "scenario": "chat-edit",
          "passed": true,
          "cyclesUsed": 1,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        }
      ],
      "narrative": "Near-flawless across all tests, with the only content blemish being a T2 warning where a \"Metric\" stretch column header was declared without a corresponding `1fr`/`auto` column to absorb surplus space. The chat-edit task burned 4 cycles to converge — double the typical run — suggesting it over-iterates on interactive edits. Template variable handling is spotless.",
      "narrativeModel": "openrouter-claude-sonnet:anthropic/claude-sonnet-4.6",
      "narrativeCostUSD": 0.006417
    },
    {
      "provider": "openrouter-gpt5-4",
      "model": "openai/gpt-5.4",
      "totalTests": 6,
      "passCount": 6,
      "renderCount": 6,
      "cleanRate": 1,
      "avgCyclesUsed": 1.6666666666666667,
      "avgLatencyMs": 57711,
      "totalInTokens": 258266,
      "totalOutTokens": 32122,
      "meanFirstAttemptSkill": 0.9895833333333334,
      "skillRows": 6,
      "runCostUSD": 1.127495,
      "outputPricePerMTok": 15,
      "skillModules": {
        "tableAuthoring": {
          "meanScore": 0.975,
          "applicableRows": 5
        },
        "templateVars": {
          "meanScore": 1,
          "applicableRows": 6
        }
      },
      "perTest": [
        {
          "test": "generate-invoice",
          "scenario": "generate",
          "passed": true,
          "cyclesUsed": 2,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "adapt-invoice",
          "scenario": "adapt",
          "passed": true,
          "cyclesUsed": 2,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "paginate-invoice",
          "scenario": "paginate",
          "passed": true,
          "cyclesUsed": 1,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "generate-cv",
          "scenario": "cv",
          "passed": true,
          "cyclesUsed": 2,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "fix-broken",
          "scenario": "fix",
          "passed": true,
          "cyclesUsed": 2,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 0.9375
        },
        {
          "test": "chat-edit-invoice",
          "scenario": "chat-edit",
          "passed": true,
          "cyclesUsed": 1,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        }
      ],
      "narrative": "Near-perfect across all six tests, with flawless template variable substitution and clean renders every time. The one recurring slip is a T2 column-width mismatch — declaring a stretch column header (\"Metric\") without a corresponding `1fr`/`auto-stretch` column to absorb surplus space. The chat-edit task burned 4 cycles to converge, the only sign of iterative struggle in an otherwise efficient run.",
      "narrativeModel": "openrouter-claude-sonnet:anthropic/claude-sonnet-4.6",
      "narrativeCostUSD": 0.007797
    },
    {
      "provider": "openrouter-grok-4-20",
      "model": "x-ai/grok-4.20",
      "totalTests": 6,
      "passCount": 4,
      "renderCount": 6,
      "cleanRate": 0.6666666666666666,
      "avgCyclesUsed": 2.8333333333333335,
      "avgLatencyMs": 53771,
      "totalInTokens": 416687,
      "totalOutTokens": 91564,
      "meanFirstAttemptSkill": 0.9895833333333334,
      "skillRows": 6,
      "runCostUSD": 0.74976875,
      "outputPricePerMTok": 2.5,
      "skillModules": {
        "tableAuthoring": {
          "meanScore": 0.975,
          "applicableRows": 5
        },
        "templateVars": {
          "meanScore": 1,
          "applicableRows": 6
        }
      },
      "perTest": [
        {
          "test": "generate-invoice",
          "scenario": "generate",
          "passed": false,
          "cyclesUsed": 5,
          "catalogErrors": 0,
          "catalogWarnings": 1,
          "error": null,
          "failureKind": "content",
          "firstAttemptScore": 1
        },
        {
          "test": "adapt-invoice",
          "scenario": "adapt",
          "passed": false,
          "cyclesUsed": 5,
          "catalogErrors": 0,
          "catalogWarnings": 2,
          "error": null,
          "failureKind": "content",
          "firstAttemptScore": 1
        },
        {
          "test": "paginate-invoice",
          "scenario": "paginate",
          "passed": true,
          "cyclesUsed": 2,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "generate-cv",
          "scenario": "cv",
          "passed": true,
          "cyclesUsed": 2,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "fix-broken",
          "scenario": "fix",
          "passed": true,
          "cyclesUsed": 2,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 0.9375
        },
        {
          "test": "chat-edit-invoice",
          "scenario": "chat-edit",
          "passed": true,
          "cyclesUsed": 1,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        }
      ],
      "narrative": "Both failures share the same root cause: the model repeatedly declares a stretch-labelled column header (\"Metric\") without assigning the corresponding column a `1fr`/`auto`/`auto-stretch` width — and it never self-corrects across five cycles on each invoice task. Everything renders cleanly and template variable handling is flawless, so the drag is entirely this one persistent T2 misconfiguration in table layout.",
      "narrativeModel": "openrouter-claude-sonnet:anthropic/claude-sonnet-4.6",
      "narrativeCostUSD": 0.008901
    },
    {
      "provider": "openrouter-grok-4-fast",
      "model": "x-ai/grok-4-fast",
      "totalTests": 6,
      "passCount": 6,
      "renderCount": 6,
      "cleanRate": 1,
      "avgCyclesUsed": 1.8333333333333333,
      "avgLatencyMs": 52658,
      "totalInTokens": 276509,
      "totalOutTokens": 47018,
      "meanFirstAttemptSkill": 0.9791666666666666,
      "skillRows": 6,
      "runCostUSD": 0.0788108,
      "outputPricePerMTok": 0.5,
      "skillModules": {
        "tableAuthoring": {
          "meanScore": 0.95,
          "applicableRows": 5
        },
        "templateVars": {
          "meanScore": 1,
          "applicableRows": 6
        }
      },
      "perTest": [
        {
          "test": "generate-invoice",
          "scenario": "generate",
          "passed": true,
          "cyclesUsed": 2,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "adapt-invoice",
          "scenario": "adapt",
          "passed": true,
          "cyclesUsed": 2,
          "catalogErrors": 0,
          "catalogWarnings": 1,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "paginate-invoice",
          "scenario": "paginate",
          "passed": true,
          "cyclesUsed": 1,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "generate-cv",
          "scenario": "cv",
          "passed": true,
          "cyclesUsed": 2,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "fix-broken",
          "scenario": "fix",
          "passed": true,
          "cyclesUsed": 3,
          "catalogErrors": 0,
          "catalogWarnings": 1,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 0.875
        },
        {
          "test": "chat-edit-invoice",
          "scenario": "chat-edit",
          "passed": true,
          "cyclesUsed": 1,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        }
      ],
      "narrative": "Perfect pass rate with near-flawless first attempts, but table layout trips it up consistently: it declares stretch column headers (T2) without a matching `1fr`/`auto-stretch` column to absorb surplus width, and occasionally emits rows with fewer cells than the table has columns rather than using `colspan` (T4). The `fix-broken` task needed three cycles and still left a warning; `chat-edit` took four cycles to converge — both suggesting iterative correction rather than clean-shot repair on complex editing tasks.",
      "narrativeModel": "openrouter-claude-sonnet:anthropic/claude-sonnet-4.6",
      "narrativeCostUSD": 0.010098
    },
    {
      "provider": "openrouter-glm-47",
      "model": "z-ai/glm-4.7",
      "totalTests": 6,
      "passCount": 5,
      "renderCount": 6,
      "cleanRate": 0.8333333333333334,
      "avgCyclesUsed": 3,
      "avgLatencyMs": 150479,
      "totalInTokens": 448026,
      "totalOutTokens": 94671,
      "meanFirstAttemptSkill": 0.9895833333333334,
      "skillRows": 6,
      "runCostUSD": 0.34488465,
      "outputPricePerMTok": 1.75,
      "skillModules": {
        "tableAuthoring": {
          "meanScore": 0.975,
          "applicableRows": 5
        },
        "templateVars": {
          "meanScore": 1,
          "applicableRows": 6
        }
      },
      "perTest": [
        {
          "test": "generate-invoice",
          "scenario": "generate",
          "passed": true,
          "cyclesUsed": 2,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "adapt-invoice",
          "scenario": "adapt",
          "passed": false,
          "cyclesUsed": 5,
          "catalogErrors": 0,
          "catalogWarnings": 1,
          "error": null,
          "failureKind": "content",
          "firstAttemptScore": 1
        },
        {
          "test": "paginate-invoice",
          "scenario": "paginate",
          "passed": true,
          "cyclesUsed": 4,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "generate-cv",
          "scenario": "cv",
          "passed": true,
          "cyclesUsed": 3,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "fix-broken",
          "scenario": "fix",
          "passed": true,
          "cyclesUsed": 3,
          "catalogErrors": 0,
          "catalogWarnings": 1,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 0.9375
        },
        {
          "test": "chat-edit-invoice",
          "scenario": "chat-edit",
          "passed": true,
          "cyclesUsed": 1,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        }
      ],
      "narrative": "Strong semantic accuracy throughout — skill scores stay near perfect even where it fails — but it burns cycles iterating toward the finish line, averaging 3.5 per test and spending 5 cycles on the one outright failure. That content failure in `adapt-invoice` traces to a T2 violation: it declared a stretch-labelled column header (\"Metric\") without assigning a corresponding `1fr`/`auto-stretch` column definition to absorb surplus width, a structural column-layout mistake it never self-corrected.",
      "narrativeModel": "openrouter-claude-sonnet:anthropic/claude-sonnet-4.6",
      "narrativeCostUSD": 0.009999
    },
    {
      "provider": "openrouter-kimi-k2-6",
      "model": "moonshotai/kimi-k2.6",
      "totalTests": 6,
      "passCount": 6,
      "renderCount": 6,
      "cleanRate": 1,
      "avgCyclesUsed": 2,
      "avgLatencyMs": 464425,
      "totalInTokens": 298829,
      "totalOutTokens": 126422,
      "meanFirstAttemptSkill": 1,
      "skillRows": 6,
      "runCostUSD": 0.66361046,
      "outputPricePerMTok": 3.5,
      "skillModules": {
        "tableAuthoring": {
          "meanScore": 1,
          "applicableRows": 5
        },
        "templateVars": {
          "meanScore": 1,
          "applicableRows": 6
        }
      },
      "perTest": [
        {
          "test": "generate-invoice",
          "scenario": "generate",
          "passed": true,
          "cyclesUsed": 2,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "paginate-invoice",
          "scenario": "paginate",
          "passed": true,
          "cyclesUsed": 2,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "chat-edit-invoice",
          "scenario": "chat-edit",
          "passed": true,
          "cyclesUsed": 1,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "generate-cv",
          "scenario": "cv",
          "passed": true,
          "cyclesUsed": 2,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "fix-broken",
          "scenario": "fix",
          "passed": true,
          "cyclesUsed": 3,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "adapt-invoice",
          "scenario": "adapt",
          "passed": true,
          "cyclesUsed": 2,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        }
      ],
      "narrative": "Perfect score across all tasks with no errors or warnings. The fix-broken case needed 3 cycles to converge, suggesting the model required a couple of correction rounds before producing a clean repair, but every other task settled in 1-2. Unremarkable in terms of failure patterns — there are none to report.",
      "narrativeModel": "openrouter-claude-sonnet:anthropic/claude-sonnet-4.6",
      "narrativeCostUSD": 0.004254
    },
    {
      "provider": "openrouter-deepseek-v4-flash",
      "model": "deepseek/deepseek-v4-flash",
      "totalTests": 6,
      "passCount": 6,
      "renderCount": 6,
      "cleanRate": 1,
      "avgCyclesUsed": 2,
      "avgLatencyMs": 32509,
      "totalInTokens": 317255,
      "totalOutTokens": 27682,
      "meanFirstAttemptSkill": 0.9895833333333334,
      "skillRows": 6,
      "runCostUSD": 0.052166660000000004,
      "outputPricePerMTok": 0.28,
      "skillModules": {
        "tableAuthoring": {
          "meanScore": 0.975,
          "applicableRows": 5
        },
        "templateVars": {
          "meanScore": 1,
          "applicableRows": 6
        }
      },
      "perTest": [
        {
          "test": "generate-invoice",
          "scenario": "generate",
          "passed": true,
          "cyclesUsed": 1,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "adapt-invoice",
          "scenario": "adapt",
          "passed": true,
          "cyclesUsed": 3,
          "catalogErrors": 0,
          "catalogWarnings": 2,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "paginate-invoice",
          "scenario": "paginate",
          "passed": true,
          "cyclesUsed": 2,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "generate-cv",
          "scenario": "cv",
          "passed": true,
          "cyclesUsed": 3,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "fix-broken",
          "scenario": "fix",
          "passed": true,
          "cyclesUsed": 2,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 0.9375
        },
        {
          "test": "chat-edit-invoice",
          "scenario": "chat-edit",
          "passed": true,
          "cyclesUsed": 1,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        }
      ],
      "narrative": "Perfect pass rate, but this model rarely nails layout on the first attempt — it burns multiple cycles on adaptation, CV generation, and chat-editing tasks (up to 4), suggesting it over-generates or mis-sequences structural decisions before self-correcting. The single content imperfection is a T2 column-width mismatch: it labelled a header as stretch but failed to assign a `1fr`/`auto-stretch` column to absorb surplus space. Template variable substitution is flawless throughout.",
      "narrativeModel": "openrouter-claude-sonnet:anthropic/claude-sonnet-4.6",
      "narrativeCostUSD": 0.006945
    },
    {
      "provider": "openrouter-qwen3-6-max",
      "model": "qwen/qwen3.6-max-preview",
      "totalTests": 6,
      "passCount": 4,
      "renderCount": 6,
      "cleanRate": 0.6666666666666666,
      "avgCyclesUsed": 2.8333333333333335,
      "avgLatencyMs": 146952,
      "totalInTokens": 444352,
      "totalOutTokens": 82797,
      "meanFirstAttemptSkill": 0.9895833333333334,
      "skillRows": 6,
      "runCostUSD": 0.9787793600000001,
      "outputPricePerMTok": 6.24,
      "skillModules": {
        "tableAuthoring": {
          "meanScore": 0.975,
          "applicableRows": 5
        },
        "templateVars": {
          "meanScore": 1,
          "applicableRows": 6
        }
      },
      "perTest": [
        {
          "test": "generate-invoice",
          "scenario": "generate",
          "passed": false,
          "cyclesUsed": 5,
          "catalogErrors": 0,
          "catalogWarnings": 1,
          "error": null,
          "failureKind": "content",
          "firstAttemptScore": 1
        },
        {
          "test": "adapt-invoice",
          "scenario": "adapt",
          "passed": true,
          "cyclesUsed": 3,
          "catalogErrors": 0,
          "catalogWarnings": 1,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "paginate-invoice",
          "scenario": "paginate",
          "passed": true,
          "cyclesUsed": 1,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "chat-edit-invoice",
          "scenario": "chat-edit",
          "passed": true,
          "cyclesUsed": 1,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "generate-cv",
          "scenario": "cv",
          "passed": false,
          "cyclesUsed": 5,
          "catalogErrors": 1,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": "content",
          "firstAttemptScore": 1
        },
        {
          "test": "fix-broken",
          "scenario": "fix",
          "passed": true,
          "cyclesUsed": 2,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 0.9375
        }
      ],
      "narrative": "Template variable handling is flawless and overall DSL knowledge is high, but the model failed to close on a T2 column-width mismatch in invoice generation — it burned 5 cycles without ever adding the required `1fr`/`auto` column to back a stretch header, ultimately failing the test despite zero errors. The same warning surfaced in the adapt run but didn't block passage there. One CV request failed in transit and should not be attributed to the model.",
      "narrativeModel": "openrouter-claude-sonnet:anthropic/claude-sonnet-4.6",
      "narrativeCostUSD": 0.01023
    },
    {
      "provider": "openrouter-llama4-maverick",
      "model": "meta-llama/llama-4-maverick",
      "totalTests": 6,
      "passCount": 5,
      "renderCount": 5,
      "cleanRate": 0.8333333333333334,
      "avgCyclesUsed": 2,
      "avgLatencyMs": 23029,
      "totalInTokens": 305306,
      "totalOutTokens": 14375,
      "meanFirstAttemptSkill": 0.9875,
      "skillRows": 5,
      "runCostUSD": 0.0544209,
      "outputPricePerMTok": 0.6,
      "skillModules": {
        "tableAuthoring": {
          "meanScore": 0.975,
          "applicableRows": 5
        },
        "templateVars": {
          "meanScore": 1,
          "applicableRows": 5
        }
      },
      "perTest": [
        {
          "test": "generate-invoice",
          "scenario": "generate",
          "passed": true,
          "cyclesUsed": 1,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "adapt-invoice",
          "scenario": "adapt",
          "passed": true,
          "cyclesUsed": 3,
          "catalogErrors": 0,
          "catalogWarnings": 1,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "paginate-invoice",
          "scenario": "paginate",
          "passed": true,
          "cyclesUsed": 3,
          "catalogErrors": 0,
          "catalogWarnings": 1,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "generate-cv",
          "scenario": "cv",
          "passed": false,
          "cyclesUsed": 2,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": "content",
          "firstAttemptScore": null
        },
        {
          "test": "fix-broken",
          "scenario": "fix",
          "passed": true,
          "cyclesUsed": 2,
          "catalogErrors": 0,
          "catalogWarnings": 1,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 0.9375
        },
        {
          "test": "chat-edit-invoice",
          "scenario": "chat-edit",
          "passed": true,
          "cyclesUsed": 1,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        }
      ],
      "narrative": "Strong on template variable handling and invoice tasks, but burns extra cycles converging — the chat-edit test took 4 cycles and two invoice tests needed 3 each. The sole content failure is on CV generation, where output was wrong enough to not score at all. Recurring table issue: declaring a stretch column header (e.g. \"Metric\") without a corresponding `1fr`/`auto-stretch` column to actually absorb the surplus space.",
      "narrativeModel": "openrouter-claude-sonnet:anthropic/claude-sonnet-4.6",
      "narrativeCostUSD": 0.008418
    },
    {
      "provider": "openrouter-mistral-medium",
      "model": "mistralai/mistral-medium-3-5",
      "totalTests": 6,
      "passCount": 5,
      "renderCount": 5,
      "cleanRate": 0.8333333333333334,
      "avgCyclesUsed": 2.5,
      "avgLatencyMs": 7954,
      "totalInTokens": 393313,
      "totalOutTokens": 18954,
      "meanFirstAttemptSkill": 1,
      "skillRows": 6,
      "runCostUSD": 0.7321245,
      "outputPricePerMTok": 7.5,
      "skillModules": {
        "tableAuthoring": {
          "meanScore": 1,
          "applicableRows": 5
        },
        "templateVars": {
          "meanScore": 1,
          "applicableRows": 6
        }
      },
      "perTest": [
        {
          "test": "generate-invoice",
          "scenario": "generate",
          "passed": true,
          "cyclesUsed": 1,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "adapt-invoice",
          "scenario": "adapt",
          "passed": true,
          "cyclesUsed": 2,
          "catalogErrors": 0,
          "catalogWarnings": 1,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "paginate-invoice",
          "scenario": "paginate",
          "passed": true,
          "cyclesUsed": 3,
          "catalogErrors": 0,
          "catalogWarnings": 1,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "generate-cv",
          "scenario": "cv",
          "passed": false,
          "cyclesUsed": 5,
          "catalogErrors": 1,
          "catalogWarnings": 1,
          "error": null,
          "failureKind": "content",
          "firstAttemptScore": 1
        },
        {
          "test": "fix-broken",
          "scenario": "fix",
          "passed": true,
          "cyclesUsed": 3,
          "catalogErrors": 0,
          "catalogWarnings": 1,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        },
        {
          "test": "chat-edit-invoice",
          "scenario": "chat-edit",
          "passed": true,
          "cyclesUsed": 1,
          "catalogErrors": 0,
          "catalogWarnings": 0,
          "error": null,
          "failureKind": null,
          "firstAttemptScore": 1
        }
      ],
      "narrative": "Handles invoicing tasks reliably, though it rarely lands cleanly on the first pass — pagination and chat-editing both needed 3–4 cycles to converge. The CV generation is the standout failure: it burned all 5 cycles and still couldn't produce a passing document, suggesting it gets trapped in a correction loop on more structurally complex layouts without making meaningful forward progress.",
      "narrativeModel": "openrouter-claude-sonnet:anthropic/claude-sonnet-4.6",
      "narrativeCostUSD": 0.006057
    }
  ],
  "rows": [
    {
      "provider": "openrouter-claude-sonnet",
      "model": "anthropic/claude-sonnet-4.6",
      "test": "generate-invoice",
      "scenario": "generate",
      "runStartedAt": 1778567134383,
      "latencyMs": 42317,
      "inputTokens": 45332,
      "outputTokens": 6364,
      "outputChars": 3235,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 35
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 2
    },
    {
      "provider": "openrouter-claude-haiku",
      "model": "anthropic/claude-haiku-4.5",
      "test": "generate-invoice",
      "scenario": "generate",
      "runStartedAt": 1778567134383,
      "latencyMs": 26751,
      "inputTokens": 45352,
      "outputTokens": 9650,
      "outputChars": 2729,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 34
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 2
    },
    {
      "provider": "openrouter-gpt5",
      "model": "openai/gpt-5",
      "test": "generate-invoice",
      "scenario": "generate",
      "runStartedAt": 1778567134383,
      "latencyMs": 35294,
      "inputTokens": 38976,
      "outputTokens": 5474,
      "outputChars": 2748,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 35
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 2
    },
    {
      "provider": "openrouter-gpt5-mini",
      "model": "openai/gpt-5-mini",
      "test": "generate-invoice",
      "scenario": "generate",
      "runStartedAt": 1778567134383,
      "latencyMs": 19801,
      "inputTokens": 38949,
      "outputTokens": 5182,
      "outputChars": 3102,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 1,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 35
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 2
    },
    {
      "provider": "openrouter-gpt5-4-mini",
      "model": "openai/gpt-5.4-mini",
      "test": "generate-invoice",
      "scenario": "generate",
      "runStartedAt": 1778567134383,
      "latencyMs": 13945,
      "inputTokens": 39195,
      "outputTokens": 6904,
      "outputChars": 3754,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 35
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 2
    },
    {
      "provider": "openrouter-gpt5-4-nano",
      "model": "openai/gpt-5.4-nano",
      "test": "generate-invoice",
      "scenario": "generate",
      "runStartedAt": 1778567134383,
      "latencyMs": 34115,
      "inputTokens": 39081,
      "outputTokens": 6163,
      "outputChars": 3090,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 35
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 2
    },
    {
      "provider": "openrouter-gemini-pro",
      "model": "google/gemini-2.5-pro",
      "test": "generate-invoice",
      "scenario": "generate",
      "runStartedAt": 1778567134383,
      "latencyMs": 24944,
      "inputTokens": 67079,
      "outputTokens": 12276,
      "outputChars": 3222,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 34
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 3
    },
    {
      "provider": "openrouter-grok",
      "model": "x-ai/grok-4",
      "test": "generate-invoice",
      "scenario": "generate",
      "runStartedAt": 1778567134383,
      "latencyMs": 325130,
      "inputTokens": 61016,
      "outputTokens": 12965,
      "outputChars": 2689,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 34
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 3
    },
    {
      "provider": "openrouter-qwen3",
      "model": "qwen/qwen3.5-122b-a10b",
      "test": "generate-invoice",
      "scenario": "generate",
      "runStartedAt": 1778567134383,
      "latencyMs": 13324,
      "inputTokens": 64404,
      "outputTokens": 4850,
      "outputChars": 2676,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 1,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 35
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 3
    },
    {
      "provider": "openrouter-glm-46",
      "model": "z-ai/glm-4.6",
      "test": "generate-invoice",
      "scenario": "generate",
      "runStartedAt": 1778567134383,
      "latencyMs": 50731,
      "inputTokens": 19089,
      "outputTokens": 1060,
      "outputChars": 2583,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 35
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 1
    },
    {
      "provider": "openrouter-deepseek-v4",
      "model": "deepseek/deepseek-v4-pro",
      "test": "generate-invoice",
      "scenario": "generate",
      "runStartedAt": 1778567134383,
      "latencyMs": 74028,
      "inputTokens": 62358,
      "outputTokens": 7742,
      "outputChars": 2840,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 35
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 3
    },
    {
      "provider": "openrouter-kimi-k2",
      "model": "moonshotai/kimi-k2",
      "test": "generate-invoice",
      "scenario": "generate",
      "runStartedAt": 1778567134383,
      "latencyMs": 21987,
      "inputTokens": 38770,
      "outputTokens": 1615,
      "outputChars": 2647,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 35
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 2
    },
    {
      "provider": "openrouter-gpt5-1-codex-mini",
      "model": "openai/gpt-5.1-codex-mini",
      "test": "generate-invoice",
      "scenario": "generate",
      "runStartedAt": 1778567134383,
      "latencyMs": 23531,
      "inputTokens": 39048,
      "outputTokens": 6739,
      "outputChars": 2803,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 34
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 2
    },
    {
      "provider": "openrouter-qwen3-32b",
      "model": "qwen/qwen3-32b",
      "test": "generate-invoice",
      "scenario": "generate",
      "runStartedAt": 1778567134383,
      "latencyMs": 94748,
      "inputTokens": 62127,
      "outputTokens": 8862,
      "outputChars": 2968,
      "valid": false,
      "dslParsed": false,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [
        "DSL execution failed: DSL execution failed: Unterminated string constant (74:8)\n  |   date: \"31 March  witnessed\n  |         ^",
        "Missing const template = doc(...)",
        "Missing const sampleData = {...}"
      ],
      "rendered": null,
      "renderError": null,
      "error": null,
      "cyclesUsed": 3,
      "cleanReached": false
    },
    {
      "provider": "openrouter-claude-sonnet",
      "model": "anthropic/claude-sonnet-4.6",
      "test": "adapt-invoice",
      "scenario": "adapt",
      "runStartedAt": 1778567134383,
      "latencyMs": 140632,
      "inputTokens": 46919,
      "outputTokens": 14153,
      "outputChars": 2646,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 34
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 2
    },
    {
      "provider": "openrouter-claude-haiku",
      "model": "anthropic/claude-haiku-4.5",
      "test": "adapt-invoice",
      "scenario": "adapt",
      "runStartedAt": 1778567134383,
      "latencyMs": 25049,
      "inputTokens": 72225,
      "outputTokens": 18719,
      "outputChars": 2550,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 33
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 3
    },
    {
      "provider": "openrouter-gpt5",
      "model": "openai/gpt-5",
      "test": "adapt-invoice",
      "scenario": "adapt",
      "runStartedAt": 1778567134383,
      "latencyMs": 90804,
      "inputTokens": 40371,
      "outputTokens": 6177,
      "outputChars": 2728,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 33
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 2
    },
    {
      "provider": "openrouter-gpt5-mini",
      "model": "openai/gpt-5-mini",
      "test": "adapt-invoice",
      "scenario": "adapt",
      "runStartedAt": 1778567134383,
      "latencyMs": 18104,
      "inputTokens": 40384,
      "outputTokens": 4482,
      "outputChars": 2679,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 1,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 33
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 2
    },
    {
      "provider": "openrouter-gpt5-4-mini",
      "model": "openai/gpt-5.4-mini",
      "test": "adapt-invoice",
      "scenario": "adapt",
      "runStartedAt": 1778567134383,
      "latencyMs": 20582,
      "inputTokens": 62231,
      "outputTokens": 9545,
      "outputChars": 2767,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 34
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 3
    },
    {
      "provider": "openrouter-gpt5-4-nano",
      "model": "openai/gpt-5.4-nano",
      "test": "adapt-invoice",
      "scenario": "adapt",
      "runStartedAt": 1778567134383,
      "latencyMs": 22096,
      "inputTokens": 40352,
      "outputTokens": 3742,
      "outputChars": 3137,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 1,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 34
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 2
    },
    {
      "provider": "openrouter-gemini-pro",
      "model": "google/gemini-2.5-pro",
      "test": "adapt-invoice",
      "scenario": "adapt",
      "runStartedAt": 1778567134383,
      "latencyMs": 28681,
      "inputTokens": 69165,
      "outputTokens": 17158,
      "outputChars": 2538,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 2,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 34
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 3
    },
    {
      "provider": "openrouter-grok",
      "model": "x-ai/grok-4",
      "test": "adapt-invoice",
      "scenario": "adapt",
      "runStartedAt": 1778567134383,
      "latencyMs": 661885,
      "inputTokens": 41212,
      "outputTokens": 10980,
      "outputChars": 2971,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 34
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 2
    },
    {
      "provider": "openrouter-qwen3",
      "model": "qwen/qwen3.5-122b-a10b",
      "test": "adapt-invoice",
      "scenario": "adapt",
      "runStartedAt": 1778567134383,
      "latencyMs": 10897,
      "inputTokens": 66892,
      "outputTokens": 4618,
      "outputChars": 3035,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 34
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 3
    },
    {
      "provider": "openrouter-glm-46",
      "model": "z-ai/glm-4.6",
      "test": "adapt-invoice",
      "scenario": "adapt",
      "runStartedAt": 1778567134383,
      "latencyMs": 48520,
      "inputTokens": 85570,
      "outputTokens": 5392,
      "outputChars": 2614,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 1,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 33
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 4
    },
    {
      "provider": "openrouter-deepseek-v4",
      "model": "deepseek/deepseek-v4-pro",
      "test": "adapt-invoice",
      "scenario": "adapt",
      "runStartedAt": 1778567134383,
      "latencyMs": 17290,
      "inputTokens": 20381,
      "outputTokens": 873,
      "outputChars": 2470,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 34
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 1
    },
    {
      "provider": "openrouter-kimi-k2",
      "model": "moonshotai/kimi-k2",
      "test": "adapt-invoice",
      "scenario": "adapt",
      "runStartedAt": 1778567134383,
      "latencyMs": 21413,
      "inputTokens": 84162,
      "outputTokens": 3165,
      "outputChars": 2324,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 1,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 34
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 4
    },
    {
      "provider": "openrouter-gpt5-1-codex-mini",
      "model": "openai/gpt-5.1-codex-mini",
      "test": "adapt-invoice",
      "scenario": "adapt",
      "runStartedAt": 1778567134383,
      "latencyMs": 39466,
      "inputTokens": 19682,
      "outputTokens": 4501,
      "outputChars": 2657,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 33
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 1
    },
    {
      "provider": "openrouter-qwen3-32b",
      "model": "qwen/qwen3-32b",
      "test": "adapt-invoice",
      "scenario": "adapt",
      "runStartedAt": 1778567134383,
      "latencyMs": 32193,
      "inputTokens": 88166,
      "outputTokens": 13187,
      "outputChars": 2690,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 33
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 4
    },
    {
      "provider": "openrouter-claude-sonnet",
      "model": "anthropic/claude-sonnet-4.6",
      "test": "paginate-invoice",
      "scenario": "paginate",
      "runStartedAt": 1778567134383,
      "latencyMs": 146718,
      "inputTokens": 24501,
      "outputTokens": 12781,
      "outputChars": 7982,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 2,
        "sizeKB": 58
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 1
    },
    {
      "provider": "openrouter-claude-haiku",
      "model": "anthropic/claude-haiku-4.5",
      "test": "paginate-invoice",
      "scenario": "paginate",
      "runStartedAt": 1778567134383,
      "latencyMs": 30095,
      "inputTokens": 51917,
      "outputTokens": 20027,
      "outputChars": 6984,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 2,
        "sizeKB": 57
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 2
    },
    {
      "provider": "openrouter-gpt5",
      "model": "openai/gpt-5",
      "test": "paginate-invoice",
      "scenario": "paginate",
      "runStartedAt": 1778567134383,
      "latencyMs": 148613,
      "inputTokens": 21187,
      "outputTokens": 7181,
      "outputChars": 9427,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 2,
        "sizeKB": 57
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 1
    },
    {
      "provider": "openrouter-gpt5-mini",
      "model": "openai/gpt-5-mini",
      "test": "paginate-invoice",
      "scenario": "paginate",
      "runStartedAt": 1778567134383,
      "latencyMs": 42367,
      "inputTokens": 21187,
      "outputTokens": 5664,
      "outputChars": 7433,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 2,
        "sizeKB": 56
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 1
    },
    {
      "provider": "openrouter-gpt5-4-mini",
      "model": "openai/gpt-5.4-mini",
      "test": "paginate-invoice",
      "scenario": "paginate",
      "runStartedAt": 1778567134383,
      "latencyMs": 27241,
      "inputTokens": 43331,
      "outputTokens": 12053,
      "outputChars": 2744,
      "valid": false,
      "dslParsed": false,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [
        "DSL execution failed: DSL execution failed: Cannot evaluate ForStatement",
        "Missing const template = doc(...)",
        "Missing const sampleData = {...}"
      ],
      "rendered": null,
      "renderError": null,
      "error": null,
      "cyclesUsed": 2,
      "cleanReached": false
    },
    {
      "provider": "openrouter-gpt5-4-nano",
      "model": "openai/gpt-5.4-nano",
      "test": "paginate-invoice",
      "scenario": "paginate",
      "runStartedAt": 1778567134383,
      "latencyMs": 52888,
      "inputTokens": 21187,
      "outputTokens": 7652,
      "outputChars": 7457,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 2,
        "sizeKB": 57
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 1
    },
    {
      "provider": "openrouter-gemini-pro",
      "model": "google/gemini-2.5-pro",
      "test": "paginate-invoice",
      "scenario": "paginate",
      "runStartedAt": 1778567134383,
      "latencyMs": 54664,
      "inputTokens": 145878,
      "outputTokens": 43368,
      "outputChars": 6516,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 2,
        "sizeKB": 57
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 5
    },
    {
      "provider": "openrouter-grok",
      "model": "x-ai/grok-4",
      "test": "paginate-invoice",
      "scenario": "paginate",
      "runStartedAt": 1778567134383,
      "latencyMs": 86752,
      "inputTokens": 46013,
      "outputTokens": 12370,
      "outputChars": 8222,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 2,
        "sizeKB": 57
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 2
    },
    {
      "provider": "openrouter-qwen3",
      "model": "qwen/qwen3.5-122b-a10b",
      "test": "paginate-invoice",
      "scenario": "paginate",
      "runStartedAt": 1778567134383,
      "latencyMs": 52027,
      "inputTokens": 23005,
      "outputTokens": 4073,
      "outputChars": 7172,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 2,
        "sizeKB": 55
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 1
    },
    {
      "provider": "openrouter-glm-46",
      "model": "z-ai/glm-4.6",
      "test": "paginate-invoice",
      "scenario": "paginate",
      "runStartedAt": 1778567134383,
      "latencyMs": 68991,
      "inputTokens": 45351,
      "outputTokens": 5741,
      "outputChars": 7802,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 2,
        "sizeKB": 56
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 2
    },
    {
      "provider": "openrouter-deepseek-v4",
      "model": "deepseek/deepseek-v4-pro",
      "test": "paginate-invoice",
      "scenario": "paginate",
      "runStartedAt": 1778567134383,
      "latencyMs": 120403,
      "inputTokens": 46539,
      "outputTokens": 8525,
      "outputChars": 7435,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 2,
        "sizeKB": 57
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 2
    },
    {
      "provider": "openrouter-kimi-k2",
      "model": "moonshotai/kimi-k2",
      "test": "paginate-invoice",
      "scenario": "paginate",
      "runStartedAt": 1778567134383,
      "latencyMs": 17206,
      "inputTokens": 43423,
      "outputTokens": 1601,
      "outputChars": 1775,
      "valid": false,
      "dslParsed": false,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [
        "DSL execution failed: DSL execution failed: Unexpected token (59:42)\n  |   items: Array.from({ length: 50 }, (_, i)71400.00\",\n  |                                           ^",
        "Missing const template = doc(...)",
        "Missing const sampleData = {...}"
      ],
      "rendered": null,
      "renderError": null,
      "error": null,
      "cyclesUsed": 2,
      "cleanReached": false
    },
    {
      "provider": "openrouter-gpt5-1-codex-mini",
      "model": "openai/gpt-5.1-codex-mini",
      "test": "paginate-invoice",
      "scenario": "paginate",
      "runStartedAt": 1778567134383,
      "latencyMs": 39926,
      "inputTokens": 73349,
      "outputTokens": 31162,
      "outputChars": 9435,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 2,
        "sizeKB": 57
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 3
    },
    {
      "provider": "openrouter-qwen3-32b",
      "model": "qwen/qwen3-32b",
      "test": "paginate-invoice",
      "scenario": "paginate",
      "runStartedAt": 1778567134383,
      "latencyMs": 43045,
      "inputTokens": 44847,
      "outputTokens": 5473,
      "outputChars": 2334,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 33
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 2
    },
    {
      "provider": "openrouter-claude-sonnet",
      "model": "anthropic/claude-sonnet-4.6",
      "test": "generate-cv",
      "scenario": "cv",
      "runStartedAt": 1778567134383,
      "latencyMs": 88701,
      "inputTokens": 45703,
      "outputTokens": 16416,
      "outputChars": 3970,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 33
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "templateVars"
        ],
        "modules": {
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 2
    },
    {
      "provider": "openrouter-claude-haiku",
      "model": "anthropic/claude-haiku-4.5",
      "test": "generate-cv",
      "scenario": "cv",
      "runStartedAt": 1778567134383,
      "latencyMs": 91744,
      "inputTokens": 46078,
      "outputTokens": 28024,
      "outputChars": 3570,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 33
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "templateVars"
        ],
        "modules": {
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 2
    },
    {
      "provider": "openrouter-gpt5",
      "model": "openai/gpt-5",
      "test": "generate-cv",
      "scenario": "cv",
      "runStartedAt": 1778567134383,
      "latencyMs": 34322,
      "inputTokens": 39006,
      "outputTokens": 5395,
      "outputChars": 3597,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 32
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 2
    },
    {
      "provider": "openrouter-gpt5-mini",
      "model": "openai/gpt-5-mini",
      "test": "generate-cv",
      "scenario": "cv",
      "runStartedAt": 1778567134383,
      "latencyMs": 26743,
      "inputTokens": 39320,
      "outputTokens": 6567,
      "outputChars": 4379,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 1,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 33
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "templateVars"
        ],
        "modules": {
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 2
    },
    {
      "provider": "openrouter-gpt5-4-mini",
      "model": "openai/gpt-5.4-mini",
      "test": "generate-cv",
      "scenario": "cv",
      "runStartedAt": 1778567134383,
      "latencyMs": 20346,
      "inputTokens": 39343,
      "outputTokens": 10415,
      "outputChars": 4619,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 1,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 33
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "templateVars"
        ],
        "modules": {
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 2
    },
    {
      "provider": "openrouter-gpt5-4-nano",
      "model": "openai/gpt-5.4-nano",
      "test": "generate-cv",
      "scenario": "cv",
      "runStartedAt": 1778567134383,
      "latencyMs": 11117,
      "inputTokens": 61299,
      "outputTokens": 9263,
      "outputChars": 4124,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 1,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 33
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "templateVars"
        ],
        "modules": {
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 3
    },
    {
      "provider": "openrouter-gemini-pro",
      "model": "google/gemini-2.5-pro",
      "test": "generate-cv",
      "scenario": "cv",
      "runStartedAt": 1778567134383,
      "latencyMs": 118403,
      "inputTokens": 67055,
      "outputTokens": 19715,
      "outputChars": 3648,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 32
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 3
    },
    {
      "provider": "openrouter-grok",
      "model": "x-ai/grok-4",
      "test": "generate-cv",
      "scenario": "cv",
      "runStartedAt": 1778567134383,
      "latencyMs": 83845,
      "inputTokens": 83911,
      "outputTokens": 11629,
      "outputChars": 3408,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 32
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "templateVars"
        ],
        "modules": {
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 4
    },
    {
      "provider": "openrouter-qwen3",
      "model": "qwen/qwen3.5-122b-a10b",
      "test": "generate-cv",
      "scenario": "cv",
      "runStartedAt": 1778567134383,
      "latencyMs": 32204,
      "inputTokens": 114225,
      "outputTokens": 10645,
      "outputChars": 3198,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 32
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "templateVars"
        ],
        "modules": {
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 5
    },
    {
      "provider": "openrouter-glm-46",
      "model": "z-ai/glm-4.6",
      "test": "generate-cv",
      "scenario": "cv",
      "runStartedAt": 1778567134383,
      "latencyMs": 159235,
      "inputTokens": 107258,
      "outputTokens": 11678,
      "outputChars": 3638,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 1,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 32
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "templateVars"
        ],
        "modules": {
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 5
    },
    {
      "provider": "openrouter-deepseek-v4",
      "model": "deepseek/deepseek-v4-pro",
      "test": "generate-cv",
      "scenario": "cv",
      "runStartedAt": 1778567134383,
      "latencyMs": 75049,
      "inputTokens": 112205,
      "outputTokens": 12381,
      "outputChars": 3272,
      "valid": false,
      "dslParsed": true,
      "catalogErrors": 3,
      "catalogWarnings": 0,
      "issues": [
        "3 catalog error(s)",
        "  ✗ page > template:each > column > template:each > row > column > span > ?: \"span\" has an object without a tag in kids[0] — expected a node (with a tag) or string. Arrays of nodes must be spread, not nested; in the DSL, pass children as separate args or let each()/when() flatten them.",
        "  ✗ page > template:each > row > column > span > ?: \"span\" has an object without a tag in kids[0] — expected a node (with a tag) or string. Arrays of nodes must be spread, not nested; in the DSL, pass children as separate args or let each()/when() flatten them.",
        "  ✗ page > template:each > row > column > span > ?: \"span\" has an object without a tag in kids[0] — expected a node (with a tag) or string. Arrays of nodes must be spread, not nested; in the DSL, pass children as separate args or let each()/when() flatten them."
      ],
      "rendered": {
        "pages": 1,
        "sizeKB": 29
      },
      "renderError": null,
      "error": null,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "templateVars"
        ],
        "modules": {
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 5,
      "cleanReached": false
    },
    {
      "provider": "openrouter-kimi-k2",
      "model": "moonshotai/kimi-k2",
      "test": "generate-cv",
      "scenario": "cv",
      "runStartedAt": 1778567134383,
      "latencyMs": 27190,
      "inputTokens": 82202,
      "outputTokens": 4022,
      "outputChars": 3630,
      "valid": false,
      "dslParsed": false,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [
        "DSL execution failed: DSL execution failed: Unexpected token (110:17)\n  |   education: Um  {\n  |                  ^",
        "Missing const template = doc(...)",
        "Missing const sampleData = {...}"
      ],
      "rendered": null,
      "renderError": null,
      "error": null,
      "cyclesUsed": 4,
      "cleanReached": false
    },
    {
      "provider": "openrouter-gpt5-1-codex-mini",
      "model": "openai/gpt-5.1-codex-mini",
      "test": "generate-cv",
      "scenario": "cv",
      "runStartedAt": 1778567134383,
      "latencyMs": 30879,
      "inputTokens": 111581,
      "outputTokens": 24865,
      "outputChars": 4678,
      "valid": false,
      "dslParsed": true,
      "catalogErrors": 10,
      "catalogWarnings": 0,
      "issues": [
        "10 catalog error(s)",
        "  ✗ kids[0].kids[0].kids[8].kids[0].kids[0].kids[0].kids[0].kids[0]: \"column\" cannot contain plain-string children — wrap text in a <span> or use a container that allows strings (allowed children: column, row, flow, text, span, img, input, checkbox, select, template:each, template:if, template:else-if, template:else).",
        "  ✗ kids[0].kids[0].kids[8].kids[0].kids[0].kids[0].kids[1].kids[0]: \"column\" cannot contain plain-string children — wrap text in a <span> or use a container that allows strings (allowed children: column, row, flow, text, span, img, input, checkbox, select, template:each, template:if, template:else-if, template:else).",
        "  ✗ page > column > column > template:each > column > row > column > ?: \"column\" has an object without a tag in kids[1] — expected a node (with a tag) or string. Arrays of nodes must be spread, not nested; in the DSL, pass children as separate args or let each()/when() flatten them.",
        "  ✗ kids[0].kids[0].kids[8].kids[0].kids[0].kids[2].kids[0].kids[0].kids[0].kids[0]: \"column\" cannot contain plain-string children — wrap text in a <span> or use a container that allows strings (allowed children: column, row, flow, text, span, img, input, checkbox, select, template:each, template:if, template:else-if, template:else).",
        "  ✗ kids[0].kids[0].kids[8].kids[0].kids[0].kids[2].kids[0].kids[0].kids[1].kids[0]: \"column\" cannot contain plain-string children — wrap text in a <span> or use a container that allows strings (allowed children: column, row, flow, text, span, img, input, checkbox, select, template:each, template:if, template:else-if, template:else).",
        "  ✗ kids[0].kids[0].kids[11].kids[0].kids[0].kids[0].kids[0]: \"column\" cannot contain plain-string children — wrap text in a <span> or use a container that allows strings (allowed children: column, row, flow, text, span, img, input, checkbox, select, template:each, template:if, template:else-if, template:else).",
        "  ✗ kids[0].kids[0].kids[11].kids[0].kids[0].kids[1].kids[0]: \"column\" cannot contain plain-string children — wrap text in a <span> or use a container that allows strings (allowed children: column, row, flow, text, span, img, input, checkbox, select, template:each, template:if, template:else-if, template:else).",
        "  ✗ kids[0].kids[0].kids[14].kids[0].kids[0].kids[0].kids[0].kids[0]: \"column\" cannot contain plain-string children — wrap text in a <span> or use a container that allows strings (allowed children: column, row, flow, text, span, img, input, checkbox, select, template:each, template:if, template:else-if, template:else).",
        "  ✗ kids[0].kids[0].kids[14].kids[0].kids[0].kids[0].kids[1].kids[0]: \"column\" cannot contain plain-string children — wrap text in a <span> or use a container that allows strings (allowed children: column, row, flow, text, span, img, input, checkbox, select, template:each, template:if, template:else-if, template:else).",
        "  ✗ page > column > column > template:each > column > row > column > ?: \"column\" has an object without a tag in kids[1] — expected a node (with a tag) or string. Arrays of nodes must be spread, not nested; in the DSL, pass children as separate args or let each()/when() flatten them."
      ],
      "rendered": {
        "pages": 2,
        "sizeKB": 33
      },
      "renderError": null,
      "error": null,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 5,
      "cleanReached": false
    },
    {
      "provider": "openrouter-qwen3-32b",
      "model": "qwen/qwen3-32b",
      "test": "generate-cv",
      "scenario": "cv",
      "runStartedAt": 1778567134383,
      "latencyMs": 36570,
      "inputTokens": 108603,
      "outputTokens": 12780,
      "outputChars": 3021,
      "valid": false,
      "dslParsed": true,
      "catalogErrors": 1,
      "catalogWarnings": 0,
      "issues": [
        "1 catalog error(s)",
        "  ✗ page > row > column > text > column: \"column\" inside \"text\" — \"text\" only accepts span, this-page, total-pages, string as children. Block elements inside inline containers (text/span) produce NaN coordinates at render time."
      ],
      "rendered": {
        "pages": 1,
        "sizeKB": 32
      },
      "renderError": null,
      "error": null,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "templateVars"
        ],
        "modules": {
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 5,
      "cleanReached": false
    },
    {
      "provider": "openrouter-claude-sonnet",
      "model": "anthropic/claude-sonnet-4.6",
      "test": "fix-broken",
      "scenario": "fix",
      "runStartedAt": 1778567134383,
      "latencyMs": 25360,
      "inputTokens": 43930,
      "outputTokens": 7889,
      "outputChars": 650,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 26
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 2
    },
    {
      "provider": "openrouter-claude-haiku",
      "model": "anthropic/claude-haiku-4.5",
      "test": "fix-broken",
      "scenario": "fix",
      "runStartedAt": 1778567134383,
      "latencyMs": 35732,
      "inputTokens": 44013,
      "outputTokens": 11978,
      "outputChars": 709,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 26
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 2
    },
    {
      "provider": "openrouter-gpt5",
      "model": "openai/gpt-5",
      "test": "fix-broken",
      "scenario": "fix",
      "runStartedAt": 1778567134383,
      "latencyMs": 44561,
      "inputTokens": 57208,
      "outputTokens": 6291,
      "outputChars": 734,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 26
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 3
    },
    {
      "provider": "openrouter-gpt5-mini",
      "model": "openai/gpt-5-mini",
      "test": "fix-broken",
      "scenario": "fix",
      "runStartedAt": 1778567134383,
      "latencyMs": 15467,
      "inputTokens": 37854,
      "outputTokens": 3342,
      "outputChars": 887,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 27
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 2
    },
    {
      "provider": "openrouter-gpt5-4-mini",
      "model": "openai/gpt-5.4-mini",
      "test": "fix-broken",
      "scenario": "fix",
      "runStartedAt": 1778567134383,
      "latencyMs": 14882,
      "inputTokens": 37833,
      "outputTokens": 3492,
      "outputChars": 713,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 26
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 2
    },
    {
      "provider": "openrouter-gpt5-4-nano",
      "model": "openai/gpt-5.4-nano",
      "test": "fix-broken",
      "scenario": "fix",
      "runStartedAt": 1778567134383,
      "latencyMs": 6721,
      "inputTokens": 37851,
      "outputTokens": 2649,
      "outputChars": 811,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 27
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 2
    },
    {
      "provider": "openrouter-gemini-pro",
      "model": "google/gemini-2.5-pro",
      "test": "fix-broken",
      "scenario": "fix",
      "runStartedAt": 1778567134383,
      "latencyMs": 31303,
      "inputTokens": 41721,
      "outputTokens": 9638,
      "outputChars": 696,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 26
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 2
    },
    {
      "provider": "openrouter-grok",
      "model": "x-ai/grok-4",
      "test": "fix-broken",
      "scenario": "fix",
      "runStartedAt": 1778567134383,
      "latencyMs": 17174,
      "inputTokens": 58376,
      "outputTokens": 9482,
      "outputChars": 620,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 26
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 3
    },
    {
      "provider": "openrouter-qwen3",
      "model": "qwen/qwen3.5-122b-a10b",
      "test": "fix-broken",
      "scenario": "fix",
      "runStartedAt": 1778567134383,
      "latencyMs": 8883,
      "inputTokens": 40264,
      "outputTokens": 2173,
      "outputChars": 682,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 26
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 2
    },
    {
      "provider": "openrouter-glm-46",
      "model": "z-ai/glm-4.6",
      "test": "fix-broken",
      "scenario": "fix",
      "runStartedAt": 1778567134383,
      "latencyMs": 230720,
      "inputTokens": 38007,
      "outputTokens": 1657,
      "outputChars": 680,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 1,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 26
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 2
    },
    {
      "provider": "openrouter-deepseek-v4",
      "model": "deepseek/deepseek-v4-pro",
      "test": "fix-broken",
      "scenario": "fix",
      "runStartedAt": 1778567134383,
      "latencyMs": 4173,
      "inputTokens": 39235,
      "outputTokens": 2012,
      "outputChars": 650,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 1,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 26
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 2
    },
    {
      "provider": "openrouter-kimi-k2",
      "model": "moonshotai/kimi-k2",
      "test": "fix-broken",
      "scenario": "fix",
      "runStartedAt": 1778567134383,
      "latencyMs": 7438,
      "inputTokens": 37680,
      "outputTokens": 436,
      "outputChars": 651,
      "valid": false,
      "dslParsed": false,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [
        "DSL execution failed: DSL execution failed: \"undefined\" is not defined (11:26)",
        "Missing const template = doc(...)",
        "Missing const sampleData = {...}"
      ],
      "rendered": null,
      "renderError": null,
      "error": null,
      "cyclesUsed": 2,
      "cleanReached": false
    },
    {
      "provider": "openrouter-gpt5-1-codex-mini",
      "model": "openai/gpt-5.1-codex-mini",
      "test": "fix-broken",
      "scenario": "fix",
      "runStartedAt": 1778567134383,
      "latencyMs": 5621,
      "inputTokens": 57278,
      "outputTokens": 2974,
      "outputChars": 880,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 1,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 26
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 3
    },
    {
      "provider": "openrouter-qwen3-32b",
      "model": "qwen/qwen3-32b",
      "test": "fix-broken",
      "scenario": "fix",
      "runStartedAt": 1778567134383,
      "latencyMs": 133073,
      "inputTokens": 38798,
      "outputTokens": 15178,
      "outputChars": 819,
      "valid": false,
      "dslParsed": false,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [
        "DSL execution failed: DSL execution failed: object is not iterable (cannot read property Symbol(Symbol.iterator))",
        "Missing const template = doc(...)",
        "Missing const sampleData = {...}"
      ],
      "rendered": null,
      "renderError": null,
      "error": null,
      "cyclesUsed": 2,
      "cleanReached": false
    },
    {
      "provider": "openrouter-claude-sonnet",
      "model": "anthropic/claude-sonnet-4.6",
      "test": "chat-edit-invoice",
      "scenario": "chat-edit",
      "runStartedAt": 1778567134383,
      "latencyMs": 26706,
      "inputTokens": 93785,
      "outputTokens": 4642,
      "outputChars": 2423,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 32
      },
      "renderError": null,
      "error": null,
      "chatEditChain": {
        "score": 1,
        "turns": [
          {
            "id": "bold-totals",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "font-swap",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "thanks-line",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "header-underline",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          }
        ]
      },
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 1,
      "cleanReached": true
    },
    {
      "provider": "openrouter-claude-haiku",
      "model": "anthropic/claude-haiku-4.5",
      "test": "chat-edit-invoice",
      "scenario": "chat-edit",
      "runStartedAt": 1778567134383,
      "latencyMs": 43091,
      "inputTokens": 93883,
      "outputTokens": 11568,
      "outputChars": 2357,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 32
      },
      "renderError": null,
      "error": null,
      "chatEditChain": {
        "score": 1,
        "turns": [
          {
            "id": "bold-totals",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "font-swap",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "thanks-line",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "header-underline",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          }
        ]
      },
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 1,
      "cleanReached": true
    },
    {
      "provider": "openrouter-gpt5",
      "model": "openai/gpt-5",
      "test": "chat-edit-invoice",
      "scenario": "chat-edit",
      "runStartedAt": 1778567134383,
      "latencyMs": 31955,
      "inputTokens": 80456,
      "outputTokens": 5603,
      "outputChars": 2259,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 32
      },
      "renderError": null,
      "error": null,
      "chatEditChain": {
        "score": 1,
        "turns": [
          {
            "id": "bold-totals",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "font-swap",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "thanks-line",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "header-underline",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          }
        ]
      },
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 1,
      "cleanReached": true
    },
    {
      "provider": "openrouter-gpt5-mini",
      "model": "openai/gpt-5-mini",
      "test": "chat-edit-invoice",
      "scenario": "chat-edit",
      "runStartedAt": 1778567134383,
      "latencyMs": 13107,
      "inputTokens": 80688,
      "outputTokens": 4889,
      "outputChars": 2469,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 32
      },
      "renderError": null,
      "error": null,
      "chatEditChain": {
        "score": 1,
        "turns": [
          {
            "id": "bold-totals",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "font-swap",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "thanks-line",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "header-underline",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          }
        ]
      },
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 1,
      "cleanReached": true
    },
    {
      "provider": "openrouter-gpt5-4-mini",
      "model": "openai/gpt-5.4-mini",
      "test": "chat-edit-invoice",
      "scenario": "chat-edit",
      "runStartedAt": 1778567134383,
      "latencyMs": 6665,
      "inputTokens": 80419,
      "outputTokens": 3319,
      "outputChars": 2267,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 32
      },
      "renderError": null,
      "error": null,
      "chatEditChain": {
        "score": 1,
        "turns": [
          {
            "id": "bold-totals",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "font-swap",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "thanks-line",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "header-underline",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          }
        ]
      },
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 1,
      "cleanReached": true
    },
    {
      "provider": "openrouter-gpt5-4-nano",
      "model": "openai/gpt-5.4-nano",
      "test": "chat-edit-invoice",
      "scenario": "chat-edit",
      "runStartedAt": 1778567134383,
      "latencyMs": 12067,
      "inputTokens": 80803,
      "outputTokens": 3772,
      "outputChars": 2589,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 32
      },
      "renderError": null,
      "error": null,
      "chatEditChain": {
        "score": 1,
        "turns": [
          {
            "id": "bold-totals",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "font-swap",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "thanks-line",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "header-underline",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          }
        ]
      },
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 1,
      "cleanReached": true
    },
    {
      "provider": "openrouter-gemini-pro",
      "model": "google/gemini-2.5-pro",
      "test": "chat-edit-invoice",
      "scenario": "chat-edit",
      "runStartedAt": 1778567134383,
      "latencyMs": 21747,
      "inputTokens": 89418,
      "outputTokens": 17075,
      "outputChars": 2411,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 32
      },
      "renderError": null,
      "error": null,
      "chatEditChain": {
        "score": 1,
        "turns": [
          {
            "id": "bold-totals",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "font-swap",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "thanks-line",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "header-underline",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          }
        ]
      },
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 1,
      "cleanReached": true
    },
    {
      "provider": "openrouter-grok",
      "model": "x-ai/grok-4",
      "test": "chat-edit-invoice",
      "scenario": "chat-edit",
      "runStartedAt": 1778567134383,
      "latencyMs": 61403,
      "inputTokens": 153634,
      "outputTokens": 15318,
      "outputChars": 3063,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 32
      },
      "renderError": null,
      "error": null,
      "chatEditChain": {
        "score": 1,
        "turns": [
          {
            "id": "bold-totals",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "font-swap",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "thanks-line",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "header-underline",
            "passed": true,
            "cyclesUsed": 4,
            "errors": []
          }
        ]
      },
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 4,
      "cleanReached": true
    },
    {
      "provider": "openrouter-qwen3",
      "model": "qwen/qwen3.5-122b-a10b",
      "test": "chat-edit-invoice",
      "scenario": "chat-edit",
      "runStartedAt": 1778567134383,
      "latencyMs": 12167,
      "inputTokens": 86414,
      "outputTokens": 4245,
      "outputChars": 2448,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 32
      },
      "renderError": null,
      "error": null,
      "chatEditChain": {
        "score": 1,
        "turns": [
          {
            "id": "bold-totals",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "font-swap",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "thanks-line",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "header-underline",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          }
        ]
      },
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 1,
      "cleanReached": true
    },
    {
      "provider": "openrouter-glm-46",
      "model": "z-ai/glm-4.6",
      "test": "chat-edit-invoice",
      "scenario": "chat-edit",
      "runStartedAt": 1778567134383,
      "latencyMs": 211304,
      "inputTokens": 81065,
      "outputTokens": 3012,
      "outputChars": 2355,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 32
      },
      "renderError": null,
      "error": null,
      "chatEditChain": {
        "score": 1,
        "turns": [
          {
            "id": "bold-totals",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "font-swap",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "thanks-line",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "header-underline",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          }
        ]
      },
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 1,
      "cleanReached": true
    },
    {
      "provider": "openrouter-deepseek-v4",
      "model": "deepseek/deepseek-v4-pro",
      "test": "chat-edit-invoice",
      "scenario": "chat-edit",
      "runStartedAt": 1778567134383,
      "latencyMs": 90707,
      "inputTokens": 106632,
      "outputTokens": 8979,
      "outputChars": 2419,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 32
      },
      "renderError": null,
      "error": null,
      "chatEditChain": {
        "score": 1,
        "turns": [
          {
            "id": "bold-totals",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "font-swap",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "thanks-line",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "header-underline",
            "passed": true,
            "cyclesUsed": 2,
            "errors": []
          }
        ]
      },
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 2,
      "cleanReached": true
    },
    {
      "provider": "openrouter-kimi-k2",
      "model": "moonshotai/kimi-k2",
      "test": "chat-edit-invoice",
      "scenario": "chat-edit",
      "runStartedAt": 1778567134383,
      "latencyMs": 21565,
      "inputTokens": 102144,
      "outputTokens": 3450,
      "outputChars": 2541,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 33
      },
      "renderError": null,
      "error": null,
      "chatEditChain": {
        "score": 1,
        "turns": [
          {
            "id": "bold-totals",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "font-swap",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "thanks-line",
            "passed": true,
            "cyclesUsed": 2,
            "errors": []
          },
          {
            "id": "header-underline",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          }
        ]
      },
      "skillCompliance": {
        "score": 0.9375,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 0.875,
            "errors": 0,
            "warnings": 1,
            "rules": [
              {
                "rule": "T4",
                "severity": "warning",
                "message": "Row has 5 cells but parent table has 4 columns — use colspan on the label cell to align"
              }
            ]
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 2,
      "cleanReached": true
    },
    {
      "provider": "openrouter-gpt5-1-codex-mini",
      "model": "openai/gpt-5.1-codex-mini",
      "test": "chat-edit-invoice",
      "scenario": "chat-edit",
      "runStartedAt": 1778567134383,
      "latencyMs": 14383,
      "inputTokens": 80575,
      "outputTokens": 6200,
      "outputChars": 2378,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 2,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 32
      },
      "renderError": null,
      "error": null,
      "chatEditChain": {
        "score": 1,
        "turns": [
          {
            "id": "bold-totals",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "font-swap",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "thanks-line",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "header-underline",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          }
        ]
      },
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 1,
      "cleanReached": true
    },
    {
      "provider": "openrouter-qwen3-32b",
      "model": "qwen/qwen3-32b",
      "test": "chat-edit-invoice",
      "scenario": "chat-edit",
      "runStartedAt": 1778567134383,
      "latencyMs": 32421,
      "inputTokens": 83128,
      "outputTokens": 8480,
      "outputChars": 2279,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 1,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 32
      },
      "renderError": null,
      "error": null,
      "chatEditChain": {
        "score": 0.875,
        "turns": [
          {
            "id": "bold-totals",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "font-swap",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "thanks-line",
            "passed": true,
            "cyclesUsed": 1,
            "errors": [
              "C3: Thank-you line is present and centered but not italic."
            ]
          },
          {
            "id": "header-underline",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          }
        ]
      },
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 1,
      "cleanReached": true
    },
    {
      "provider": "openrouter-claude-opus",
      "model": "anthropic/claude-opus-4.7",
      "test": "generate-invoice",
      "scenario": "generate",
      "runStartedAt": 1778632001243,
      "latencyMs": 16824,
      "inputTokens": 60228,
      "outputTokens": 3858,
      "outputChars": 3081,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 35
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 2
    },
    {
      "provider": "openrouter-gpt5-5",
      "model": "openai/gpt-5.5",
      "test": "generate-invoice",
      "scenario": "generate",
      "runStartedAt": 1778632001243,
      "latencyMs": 35361,
      "inputTokens": 39297,
      "outputTokens": 3750,
      "outputChars": 5141,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 36
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 2
    },
    {
      "provider": "openrouter-gpt5-4",
      "model": "openai/gpt-5.4",
      "test": "generate-invoice",
      "scenario": "generate",
      "runStartedAt": 1778632001243,
      "latencyMs": 47137,
      "inputTokens": 39110,
      "outputTokens": 5925,
      "outputChars": 3388,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 35
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 2
    },
    {
      "provider": "openrouter-grok-4-20",
      "model": "x-ai/grok-4.20",
      "test": "generate-invoice",
      "scenario": "generate",
      "runStartedAt": 1778632001243,
      "latencyMs": 67106,
      "inputTokens": 103854,
      "outputTokens": 23607,
      "outputChars": 2697,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 1,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 35
      },
      "renderError": null,
      "error": null,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 5,
      "cleanReached": false
    },
    {
      "provider": "openrouter-grok-4-fast",
      "model": "x-ai/grok-4-fast",
      "test": "generate-invoice",
      "scenario": "generate",
      "runStartedAt": 1778632001243,
      "latencyMs": 98111,
      "inputTokens": 38828,
      "outputTokens": 13339,
      "outputChars": 2882,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 34
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 2
    },
    {
      "provider": "openrouter-glm-47",
      "model": "z-ai/glm-4.7",
      "test": "generate-invoice",
      "scenario": "generate",
      "runStartedAt": 1778632001243,
      "latencyMs": 388910,
      "inputTokens": 39085,
      "outputTokens": 8225,
      "outputChars": 2466,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 34
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 2
    },
    {
      "provider": "openrouter-kimi-k2-6",
      "model": "moonshotai/kimi-k2.6",
      "test": "generate-invoice",
      "scenario": "generate",
      "runStartedAt": 1778632001243,
      "latencyMs": 907768,
      "inputTokens": 38836,
      "outputTokens": 27198,
      "outputChars": 2839,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 34
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 2
    },
    {
      "provider": "openrouter-deepseek-v4-flash",
      "model": "deepseek/deepseek-v4-flash",
      "test": "generate-invoice",
      "scenario": "generate",
      "runStartedAt": 1778632001243,
      "latencyMs": 14895,
      "inputTokens": 19654,
      "outputTokens": 1397,
      "outputChars": 2700,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 34
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 1
    },
    {
      "provider": "openrouter-qwen3-6-max",
      "model": "qwen/qwen3.6-max-preview",
      "test": "generate-invoice",
      "scenario": "generate",
      "runStartedAt": 1778632001243,
      "latencyMs": 121413,
      "inputTokens": 112640,
      "outputTokens": 20701,
      "outputChars": 2604,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 1,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 35
      },
      "renderError": null,
      "error": null,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 5,
      "cleanReached": false
    },
    {
      "provider": "openrouter-llama4-maverick",
      "model": "meta-llama/llama-4-maverick",
      "test": "generate-invoice",
      "scenario": "generate",
      "runStartedAt": 1778632001243,
      "latencyMs": 15599,
      "inputTokens": 18907,
      "outputTokens": 804,
      "outputChars": 2487,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 35
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 1
    },
    {
      "provider": "openrouter-mistral-medium",
      "model": "mistralai/mistral-medium-3-5",
      "test": "generate-invoice",
      "scenario": "generate",
      "runStartedAt": 1778632001243,
      "latencyMs": 6978,
      "inputTokens": 19978,
      "outputTokens": 919,
      "outputChars": 2549,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 35
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 1
    },
    {
      "provider": "openrouter-claude-opus",
      "model": "anthropic/claude-opus-4.7",
      "test": "adapt-invoice",
      "scenario": "adapt",
      "runStartedAt": 1778632001243,
      "latencyMs": 35059,
      "inputTokens": 62387,
      "outputTokens": 5595,
      "outputChars": 2686,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 34
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 2
    },
    {
      "provider": "openrouter-gpt5-5",
      "model": "openai/gpt-5.5",
      "test": "adapt-invoice",
      "scenario": "adapt",
      "runStartedAt": 1778632001243,
      "latencyMs": 19304,
      "inputTokens": 40449,
      "outputTokens": 2615,
      "outputChars": 2827,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 34
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 2
    },
    {
      "provider": "openrouter-gpt5-4",
      "model": "openai/gpt-5.4",
      "test": "adapt-invoice",
      "scenario": "adapt",
      "runStartedAt": 1778632001243,
      "latencyMs": 58205,
      "inputTokens": 40372,
      "outputTokens": 5090,
      "outputChars": 2957,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 34
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 2
    },
    {
      "provider": "openrouter-grok-4-20",
      "model": "x-ai/grok-4.20",
      "test": "adapt-invoice",
      "scenario": "adapt",
      "runStartedAt": 1778632001243,
      "latencyMs": 68299,
      "inputTokens": 108883,
      "outputTokens": 27442,
      "outputChars": 2992,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 2,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 34
      },
      "renderError": null,
      "error": null,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 5,
      "cleanReached": false
    },
    {
      "provider": "openrouter-grok-4-fast",
      "model": "x-ai/grok-4-fast",
      "test": "adapt-invoice",
      "scenario": "adapt",
      "runStartedAt": 1778632001243,
      "latencyMs": 67696,
      "inputTokens": 40144,
      "outputTokens": 11476,
      "outputChars": 2613,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 1,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 34
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 2
    },
    {
      "provider": "openrouter-glm-47",
      "model": "z-ai/glm-4.7",
      "test": "adapt-invoice",
      "scenario": "adapt",
      "runStartedAt": 1778632001243,
      "latencyMs": 70953,
      "inputTokens": 109113,
      "outputTokens": 21363,
      "outputChars": 2649,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 1,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 33
      },
      "renderError": null,
      "error": null,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 5,
      "cleanReached": false
    },
    {
      "provider": "openrouter-deepseek-v4-flash",
      "model": "deepseek/deepseek-v4-flash",
      "test": "adapt-invoice",
      "scenario": "adapt",
      "runStartedAt": 1778632001243,
      "latencyMs": 37448,
      "inputTokens": 64260,
      "outputTokens": 5001,
      "outputChars": 2425,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 2,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 34
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 3
    },
    {
      "provider": "openrouter-qwen3-6-max",
      "model": "qwen/qwen3.6-max-preview",
      "test": "adapt-invoice",
      "scenario": "adapt",
      "runStartedAt": 1778632001243,
      "latencyMs": 83737,
      "inputTokens": 66703,
      "outputTokens": 10731,
      "outputChars": 2410,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 1,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 33
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 3
    },
    {
      "provider": "openrouter-llama4-maverick",
      "model": "meta-llama/llama-4-maverick",
      "test": "adapt-invoice",
      "scenario": "adapt",
      "runStartedAt": 1778632001243,
      "latencyMs": 37705,
      "inputTokens": 61909,
      "outputTokens": 2434,
      "outputChars": 2465,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 1,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 34
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 3
    },
    {
      "provider": "openrouter-mistral-medium",
      "model": "mistralai/mistral-medium-3-5",
      "test": "adapt-invoice",
      "scenario": "adapt",
      "runStartedAt": 1778632001243,
      "latencyMs": 6742,
      "inputTokens": 42568,
      "outputTokens": 1817,
      "outputChars": 2416,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 1,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 33
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 2
    },
    {
      "provider": "openrouter-claude-opus",
      "model": "anthropic/claude-opus-4.7",
      "test": "paginate-invoice",
      "scenario": "paginate",
      "runStartedAt": 1778632001243,
      "latencyMs": 23510,
      "inputTokens": 32167,
      "outputTokens": 3615,
      "outputChars": 7419,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 2,
        "sizeKB": 57
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 1
    },
    {
      "provider": "openrouter-gpt5-5",
      "model": "openai/gpt-5.5",
      "test": "paginate-invoice",
      "scenario": "paginate",
      "runStartedAt": 1778632001243,
      "latencyMs": 48782,
      "inputTokens": 43933,
      "outputTokens": 5839,
      "outputChars": 9690,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 2,
        "sizeKB": 58
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 2
    },
    {
      "provider": "openrouter-gpt5-4",
      "model": "openai/gpt-5.4",
      "test": "paginate-invoice",
      "scenario": "paginate",
      "runStartedAt": 1778632001243,
      "latencyMs": 201498,
      "inputTokens": 21187,
      "outputTokens": 8620,
      "outputChars": 10721,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 2,
        "sizeKB": 58
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 1
    },
    {
      "provider": "openrouter-grok-4-20",
      "model": "x-ai/grok-4.20",
      "test": "paginate-invoice",
      "scenario": "paginate",
      "runStartedAt": 1778632001243,
      "latencyMs": 45106,
      "inputTokens": 45246,
      "outputTokens": 14381,
      "outputChars": 9301,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 2,
        "sizeKB": 55
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 2
    },
    {
      "provider": "openrouter-grok-4-fast",
      "model": "x-ai/grok-4-fast",
      "test": "paginate-invoice",
      "scenario": "paginate",
      "runStartedAt": 1778632001243,
      "latencyMs": 33947,
      "inputTokens": 21060,
      "outputTokens": 3915,
      "outputChars": 8974,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 3,
        "sizeKB": 58
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 1
    },
    {
      "provider": "openrouter-glm-47",
      "model": "z-ai/glm-4.7",
      "test": "paginate-invoice",
      "scenario": "paginate",
      "runStartedAt": 1778632001243,
      "latencyMs": 139858,
      "inputTokens": 101171,
      "outputTokens": 29811,
      "outputChars": 6900,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 2,
        "sizeKB": 56
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 4
    },
    {
      "provider": "openrouter-kimi-k2-6",
      "model": "moonshotai/kimi-k2.6",
      "test": "paginate-invoice",
      "scenario": "paginate",
      "runStartedAt": 1778632001243,
      "latencyMs": 83986,
      "inputTokens": 43216,
      "outputTokens": 17178,
      "outputChars": 7771,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 2,
        "sizeKB": 57
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 2
    },
    {
      "provider": "openrouter-deepseek-v4-flash",
      "model": "deepseek/deepseek-v4-flash",
      "test": "paginate-invoice",
      "scenario": "paginate",
      "runStartedAt": 1778632001243,
      "latencyMs": 35309,
      "inputTokens": 46738,
      "outputTokens": 6808,
      "outputChars": 7986,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 2,
        "sizeKB": 57
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 2
    },
    {
      "provider": "openrouter-qwen3-6-max",
      "model": "qwen/qwen3.6-max-preview",
      "test": "paginate-invoice",
      "scenario": "paginate",
      "runStartedAt": 1778632001243,
      "latencyMs": 147748,
      "inputTokens": 23005,
      "outputTokens": 6014,
      "outputChars": 7597,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 2,
        "sizeKB": 57
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 1
    },
    {
      "provider": "openrouter-llama4-maverick",
      "model": "meta-llama/llama-4-maverick",
      "test": "paginate-invoice",
      "scenario": "paginate",
      "runStartedAt": 1778632001243,
      "latencyMs": 42538,
      "inputTokens": 67769,
      "outputTokens": 6044,
      "outputChars": 7515,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 1,
      "issues": [],
      "rendered": {
        "pages": 2,
        "sizeKB": 56
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 3
    },
    {
      "provider": "openrouter-mistral-medium",
      "model": "mistralai/mistral-medium-3-5",
      "test": "paginate-invoice",
      "scenario": "paginate",
      "runStartedAt": 1778632001243,
      "latencyMs": 16289,
      "inputTokens": 72575,
      "outputTokens": 7118,
      "outputChars": 7767,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 1,
      "issues": [],
      "rendered": {
        "pages": 3,
        "sizeKB": 56
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 3
    },
    {
      "provider": "openrouter-claude-opus",
      "model": "anthropic/claude-opus-4.7",
      "test": "generate-cv",
      "scenario": "cv",
      "runStartedAt": 1778632001243,
      "latencyMs": 28003,
      "inputTokens": 94110,
      "outputTokens": 7571,
      "outputChars": 4543,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 34
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 3
    },
    {
      "provider": "openrouter-gpt5-5",
      "model": "openai/gpt-5.5",
      "test": "generate-cv",
      "scenario": "cv",
      "runStartedAt": 1778632001243,
      "latencyMs": 26288,
      "inputTokens": 39302,
      "outputTokens": 3736,
      "outputChars": 4649,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 33
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "templateVars"
        ],
        "modules": {
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 2
    },
    {
      "provider": "openrouter-gpt5-4",
      "model": "openai/gpt-5.4",
      "test": "generate-cv",
      "scenario": "cv",
      "runStartedAt": 1778632001243,
      "latencyMs": 24417,
      "inputTokens": 39343,
      "outputTokens": 7417,
      "outputChars": 4580,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 32
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "templateVars"
        ],
        "modules": {
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 2
    },
    {
      "provider": "openrouter-grok-4-20",
      "model": "x-ai/grok-4.20",
      "test": "generate-cv",
      "scenario": "cv",
      "runStartedAt": 1778632001243,
      "latencyMs": 90317,
      "inputTokens": 38832,
      "outputTokens": 11359,
      "outputChars": 3752,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 33
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "templateVars"
        ],
        "modules": {
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 2
    },
    {
      "provider": "openrouter-grok-4-fast",
      "model": "x-ai/grok-4-fast",
      "test": "generate-cv",
      "scenario": "cv",
      "runStartedAt": 1778632001243,
      "latencyMs": 90268,
      "inputTokens": 39470,
      "outputTokens": 9025,
      "outputChars": 3816,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 33
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "templateVars"
        ],
        "modules": {
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 2
    },
    {
      "provider": "openrouter-glm-47",
      "model": "z-ai/glm-4.7",
      "test": "generate-cv",
      "scenario": "cv",
      "runStartedAt": 1778632001243,
      "latencyMs": 42729,
      "inputTokens": 59769,
      "outputTokens": 11244,
      "outputChars": 2935,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 2,
        "sizeKB": 32
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "templateVars"
        ],
        "modules": {
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 3
    },
    {
      "provider": "openrouter-deepseek-v4-flash",
      "model": "deepseek/deepseek-v4-flash",
      "test": "generate-cv",
      "scenario": "cv",
      "runStartedAt": 1778632001243,
      "latencyMs": 88578,
      "inputTokens": 64086,
      "outputTokens": 7821,
      "outputChars": 4669,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 32
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "templateVars"
        ],
        "modules": {
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 3
    },
    {
      "provider": "openrouter-llama4-maverick",
      "model": "meta-llama/llama-4-maverick",
      "test": "generate-cv",
      "scenario": "cv",
      "runStartedAt": 1778632001243,
      "latencyMs": 23085,
      "inputTokens": 38657,
      "outputTokens": 1829,
      "outputChars": 3318,
      "valid": false,
      "dslParsed": false,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [
        "DSL execution failed: DSL execution failed: \"undefined\" is not defined (1:13)",
        "Missing const template = doc(...)",
        "Missing const sampleData = {...}"
      ],
      "rendered": null,
      "renderError": null,
      "error": null,
      "cyclesUsed": 2,
      "cleanReached": false
    },
    {
      "provider": "openrouter-mistral-medium",
      "model": "mistralai/mistral-medium-3-5",
      "test": "generate-cv",
      "scenario": "cv",
      "runStartedAt": 1778632001243,
      "latencyMs": 7508,
      "inputTokens": 113452,
      "outputTokens": 5385,
      "outputChars": 3683,
      "valid": false,
      "dslParsed": true,
      "catalogErrors": 1,
      "catalogWarnings": 1,
      "issues": [
        "1 catalog error(s)",
        "  ✗ page > column > column > template:each > text > template:if: \"template:if\" inside \"text\" — \"text\" only accepts span, this-page, total-pages, string as children. Block elements inside inline containers (text/span) produce NaN coordinates at render time."
      ],
      "rendered": null,
      "renderError": "Error: NaN Height!\n    at Module.setHeight (/Users/jason/dev/pdf/makesPDF/packages/@pdf/layout-engine/src/element.ts:101:11)\n    at setElHeights (/Users/jason/dev/pdf/makesPDF/packages/@pdf/layout-engine/src/child-height.ts:55:18)\n    at Array.map (<anonymous>)\n    at setElHeights (/Users/jason/dev/pdf/makesPDF/packages/@pdf/layout-engine/src/child-height.ts:49:48)\n    at Array.map (<anonymous>)\n    at setElHeights (/Users/jason/dev/pdf/makesPDF/packages/@pdf/layout-engine/src/child-height.ts:49:48)\n    at Array.map (<anonymous>)\n    at setElHeights (/Users/jason/dev/pdf/makesPDF/packages/@pdf/layout-engine/src/child-height.ts:49:48)\n    at Array.map (<anonymous>)\n    at <anonymous> (/Users/jason/dev/pdf/makesPDF/packages/@pdf/layout-engine/src/child-height.ts:157:31)",
      "error": null,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "templateVars"
        ],
        "modules": {
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 5,
      "cleanReached": false
    },
    {
      "provider": "openrouter-claude-opus",
      "model": "anthropic/claude-opus-4.7",
      "test": "fix-broken",
      "scenario": "fix",
      "runStartedAt": 1778632001243,
      "latencyMs": 3180,
      "inputTokens": 58309,
      "outputTokens": 2418,
      "outputChars": 726,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 26
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 2
    },
    {
      "provider": "openrouter-gpt5-5",
      "model": "openai/gpt-5.5",
      "test": "fix-broken",
      "scenario": "fix",
      "runStartedAt": 1778632001243,
      "latencyMs": 12874,
      "inputTokens": 37930,
      "outputTokens": 1977,
      "outputChars": 1098,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 26
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 2
    },
    {
      "provider": "openrouter-gpt5-4",
      "model": "openai/gpt-5.4",
      "test": "fix-broken",
      "scenario": "fix",
      "runStartedAt": 1778632001243,
      "latencyMs": 5282,
      "inputTokens": 37835,
      "outputTokens": 1502,
      "outputChars": 715,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 26
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 2
    },
    {
      "provider": "openrouter-grok-4-20",
      "model": "x-ai/grok-4.20",
      "test": "fix-broken",
      "scenario": "fix",
      "runStartedAt": 1778632001243,
      "latencyMs": 34655,
      "inputTokens": 37477,
      "outputTokens": 7142,
      "outputChars": 602,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 26
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 2
    },
    {
      "provider": "openrouter-grok-4-fast",
      "model": "x-ai/grok-4-fast",
      "test": "fix-broken",
      "scenario": "fix",
      "runStartedAt": 1778632001243,
      "latencyMs": 21161,
      "inputTokens": 56847,
      "outputTokens": 4918,
      "outputChars": 604,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 1,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 26
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 3
    },
    {
      "provider": "openrouter-glm-47",
      "model": "z-ai/glm-4.7",
      "test": "fix-broken",
      "scenario": "fix",
      "runStartedAt": 1778632001243,
      "latencyMs": 137484,
      "inputTokens": 57843,
      "outputTokens": 13295,
      "outputChars": 751,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 1,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 26
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 3
    },
    {
      "provider": "openrouter-deepseek-v4-flash",
      "model": "deepseek/deepseek-v4-flash",
      "test": "fix-broken",
      "scenario": "fix",
      "runStartedAt": 1778632001243,
      "latencyMs": 4465,
      "inputTokens": 39123,
      "outputTokens": 3117,
      "outputChars": 625,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 26
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 2
    },
    {
      "provider": "openrouter-llama4-maverick",
      "model": "meta-llama/llama-4-maverick",
      "test": "fix-broken",
      "scenario": "fix",
      "runStartedAt": 1778632001243,
      "latencyMs": 4088,
      "inputTokens": 37667,
      "outputTokens": 422,
      "outputChars": 634,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 1,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 26
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 2
    },
    {
      "provider": "openrouter-mistral-medium",
      "model": "mistralai/mistral-medium-3-5",
      "test": "fix-broken",
      "scenario": "fix",
      "runStartedAt": 1778632001243,
      "latencyMs": 3841,
      "inputTokens": 59904,
      "outputTokens": 680,
      "outputChars": 680,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 1,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 26
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 3
    },
    {
      "provider": "openrouter-claude-opus",
      "model": "anthropic/claude-opus-4.7",
      "test": "chat-edit-invoice",
      "scenario": "chat-edit",
      "runStartedAt": 1778632001243,
      "latencyMs": 12583,
      "inputTokens": 124866,
      "outputTokens": 4652,
      "outputChars": 2455,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 32
      },
      "renderError": null,
      "error": null,
      "chatEditChain": {
        "score": 1,
        "turns": [
          {
            "id": "bold-totals",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "font-swap",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "thanks-line",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "header-underline",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          }
        ]
      },
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 1
    },
    {
      "provider": "openrouter-gpt5-5",
      "model": "openai/gpt-5.5",
      "test": "chat-edit-invoice",
      "scenario": "chat-edit",
      "runStartedAt": 1778632001243,
      "latencyMs": 9736,
      "inputTokens": 80660,
      "outputTokens": 3159,
      "outputChars": 2446,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 32
      },
      "renderError": null,
      "error": null,
      "chatEditChain": {
        "score": 1,
        "turns": [
          {
            "id": "bold-totals",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "font-swap",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "thanks-line",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "header-underline",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          }
        ]
      },
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 1
    },
    {
      "provider": "openrouter-gpt5-4",
      "model": "openai/gpt-5.4",
      "test": "chat-edit-invoice",
      "scenario": "chat-edit",
      "runStartedAt": 1778632001243,
      "latencyMs": 9727,
      "inputTokens": 80419,
      "outputTokens": 3568,
      "outputChars": 2223,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 32
      },
      "renderError": null,
      "error": null,
      "chatEditChain": {
        "score": 1,
        "turns": [
          {
            "id": "bold-totals",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "font-swap",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "thanks-line",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "header-underline",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          }
        ]
      },
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 1
    },
    {
      "provider": "openrouter-grok-4-20",
      "model": "x-ai/grok-4.20",
      "test": "chat-edit-invoice",
      "scenario": "chat-edit",
      "runStartedAt": 1778632001243,
      "latencyMs": 17143,
      "inputTokens": 82395,
      "outputTokens": 7633,
      "outputChars": 2413,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 32
      },
      "renderError": null,
      "error": null,
      "chatEditChain": {
        "score": 1,
        "turns": [
          {
            "id": "bold-totals",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "font-swap",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "thanks-line",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "header-underline",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          }
        ]
      },
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 1
    },
    {
      "provider": "openrouter-grok-4-fast",
      "model": "x-ai/grok-4-fast",
      "test": "chat-edit-invoice",
      "scenario": "chat-edit",
      "runStartedAt": 1778632001243,
      "latencyMs": 4765,
      "inputTokens": 80160,
      "outputTokens": 4345,
      "outputChars": 2365,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 32
      },
      "renderError": null,
      "error": null,
      "chatEditChain": {
        "score": 1,
        "turns": [
          {
            "id": "bold-totals",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "font-swap",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "thanks-line",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "header-underline",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          }
        ]
      },
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 1
    },
    {
      "provider": "openrouter-glm-47",
      "model": "z-ai/glm-4.7",
      "test": "chat-edit-invoice",
      "scenario": "chat-edit",
      "runStartedAt": 1778632001243,
      "latencyMs": 122937,
      "inputTokens": 81045,
      "outputTokens": 10733,
      "outputChars": 2413,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 32
      },
      "renderError": null,
      "error": null,
      "chatEditChain": {
        "score": 1,
        "turns": [
          {
            "id": "bold-totals",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "font-swap",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "thanks-line",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "header-underline",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          }
        ]
      },
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 1
    },
    {
      "provider": "openrouter-kimi-k2-6",
      "model": "moonshotai/kimi-k2.6",
      "test": "chat-edit-invoice",
      "scenario": "chat-edit",
      "runStartedAt": 1778632001243,
      "latencyMs": 26304,
      "inputTokens": 80473,
      "outputTokens": 12741,
      "outputChars": 2384,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 32
      },
      "renderError": null,
      "error": null,
      "chatEditChain": {
        "score": 1,
        "turns": [
          {
            "id": "bold-totals",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "font-swap",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "thanks-line",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "header-underline",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          }
        ]
      },
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 1
    },
    {
      "provider": "openrouter-deepseek-v4-flash",
      "model": "deepseek/deepseek-v4-flash",
      "test": "chat-edit-invoice",
      "scenario": "chat-edit",
      "runStartedAt": 1778632001243,
      "latencyMs": 14357,
      "inputTokens": 83394,
      "outputTokens": 3538,
      "outputChars": 2237,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 32
      },
      "renderError": null,
      "error": null,
      "chatEditChain": {
        "score": 1,
        "turns": [
          {
            "id": "bold-totals",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "font-swap",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "thanks-line",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "header-underline",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          }
        ]
      },
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 1
    },
    {
      "provider": "openrouter-qwen3-6-max",
      "model": "qwen/qwen3.6-max-preview",
      "test": "chat-edit-invoice",
      "scenario": "chat-edit",
      "runStartedAt": 1778632001243,
      "latencyMs": 86040,
      "inputTokens": 86239,
      "outputTokens": 10123,
      "outputChars": 2420,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 32
      },
      "renderError": null,
      "error": null,
      "chatEditChain": {
        "score": 1,
        "turns": [
          {
            "id": "bold-totals",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "font-swap",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "thanks-line",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "header-underline",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          }
        ]
      },
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 1
    },
    {
      "provider": "openrouter-llama4-maverick",
      "model": "meta-llama/llama-4-maverick",
      "test": "chat-edit-invoice",
      "scenario": "chat-edit",
      "runStartedAt": 1778632001243,
      "latencyMs": 15159,
      "inputTokens": 80397,
      "outputTokens": 2842,
      "outputChars": 2416,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 32
      },
      "renderError": null,
      "error": null,
      "chatEditChain": {
        "score": 1,
        "turns": [
          {
            "id": "bold-totals",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "font-swap",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "thanks-line",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "header-underline",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          }
        ]
      },
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 1
    },
    {
      "provider": "openrouter-mistral-medium",
      "model": "mistralai/mistral-medium-3-5",
      "test": "chat-edit-invoice",
      "scenario": "chat-edit",
      "runStartedAt": 1778632001243,
      "latencyMs": 6367,
      "inputTokens": 84836,
      "outputTokens": 3035,
      "outputChars": 2342,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 32
      },
      "renderError": null,
      "error": null,
      "chatEditChain": {
        "score": 1,
        "turns": [
          {
            "id": "bold-totals",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "font-swap",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "thanks-line",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          },
          {
            "id": "header-underline",
            "passed": true,
            "cyclesUsed": 1,
            "errors": []
          }
        ]
      },
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 1
    },
    {
      "provider": "openrouter-qwen3-6-max",
      "model": "qwen/qwen3.6-max-preview",
      "test": "generate-cv",
      "scenario": "cv",
      "runStartedAt": 1778648120596,
      "latencyMs": 336437,
      "inputTokens": 115520,
      "outputTokens": 28020,
      "outputChars": 3643,
      "valid": false,
      "dslParsed": true,
      "catalogErrors": 1,
      "catalogWarnings": 0,
      "issues": [
        "1 catalog error(s)",
        "  ✗ page > column > column > column > template:each > text > template:if: \"template:if\" inside \"text\" — \"text\" only accepts span, this-page, total-pages, string as children. Block elements inside inline containers (text/span) produce NaN coordinates at render time."
      ],
      "rendered": {
        "pages": 1,
        "sizeKB": 32
      },
      "renderError": null,
      "error": null,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "templateVars"
        ],
        "modules": {
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 5,
      "cleanReached": false
    },
    {
      "provider": "openrouter-kimi-k2-6",
      "model": "moonshotai/kimi-k2.6",
      "test": "generate-cv",
      "scenario": "cv",
      "runStartedAt": 1778648120596,
      "latencyMs": 829187,
      "inputTokens": 38954,
      "outputTokens": 22397,
      "outputChars": 3413,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 31
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "templateVars"
        ],
        "modules": {
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 2
    },
    {
      "provider": "openrouter-qwen3-6-max",
      "model": "qwen/qwen3.6-max-preview",
      "test": "fix-broken",
      "scenario": "fix",
      "runStartedAt": 1778648120596,
      "latencyMs": 106337,
      "inputTokens": 40245,
      "outputTokens": 7208,
      "outputChars": 641,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 26
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 2
    },
    {
      "provider": "openrouter-kimi-k2-6",
      "model": "moonshotai/kimi-k2.6",
      "test": "fix-broken",
      "scenario": "fix",
      "runStartedAt": 1778648120596,
      "latencyMs": 693232,
      "inputTokens": 57026,
      "outputTokens": 27882,
      "outputChars": 600,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 26
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 3
    },
    {
      "provider": "openrouter-kimi-k2-6",
      "model": "moonshotai/kimi-k2.6",
      "test": "adapt-invoice",
      "scenario": "adapt",
      "runStartedAt": 1778655241225,
      "latencyMs": 246071,
      "inputTokens": 40324,
      "outputTokens": 19026,
      "outputChars": 2888,
      "valid": true,
      "dslParsed": true,
      "catalogErrors": 0,
      "catalogWarnings": 0,
      "issues": [],
      "rendered": {
        "pages": 1,
        "sizeKB": 34
      },
      "renderError": null,
      "error": null,
      "cleanReached": true,
      "skillCompliance": {
        "score": 1,
        "applicable": [
          "tableAuthoring",
          "templateVars"
        ],
        "modules": {
          "tableAuthoring": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          },
          "templateVars": {
            "score": 1,
            "errors": 0,
            "warnings": 0,
            "rules": []
          }
        }
      },
      "cyclesUsed": 2
    }
  ]
}