{"model":{"slug":"anthropic/claude-sonnet-4-6","display_name":"Claude Sonnet 4 6","api_model_id":"claude-sonnet-4-6","family_slug":"claude","added_at":"2026-05-04T16:43:38.341Z","settings_suffix":""},"aggregates":{"avg_score":64.972015,"tasks_attempted":268,"tasks_passed":146,"tasks_attempted_distinct":64,"tasks_passed_attempt_1":39,"tasks_passed_attempt_2_only":11,"pass_at_n":0.78125,"avg_cost_usd":0.109307,"latency_p50_ms":147062,"latency_p95_ms":185558,"pass_rate_ci":{"lower":0.665669836692222,"upper":0.8649780253865025},"pass_hat_at_n":0.734375,"cost_per_pass_usd":0.139912,"run_count":3,"verified_runs":0},"settings":{"temperature":null,"thinking_budget":null,"tokens_avg_per_run":232772,"consistency_pct":93.75},"history":[{"run_id":"b9ca725e-7be3-4b1b-9a7e-5940440ad41b","ts":"2026-05-04T23:37:17.408Z","score":64.185393,"cost_usd":2.35494,"tier":"claimed"},{"run_id":"6892ef4f-9566-4fed-aaae-641b5829730e","ts":"2026-05-04T20:18:33.860Z","score":64.444444,"cost_usd":2.361459,"tier":"claimed"},{"run_id":"75466b2c-00f2-4ba5-b7f9-e48607416da8","ts":"2026-05-04T16:43:38.341Z","score":66.292135,"cost_usd":2.27922,"tier":"claimed"}],"failure_modes":[{"code":"AL0104","count":604,"pct":0.553621,"example_message":"Syntax error, ':' expected"},{"code":"AL0111","count":92,"pct":0.084326,"example_message":"Semicolon expected. Add a semicolon (;) to terminate the statement."},{"code":"AL0000","count":77,"pct":0.070577,"example_message":"App generation failed"},{"code":"AL0224","count":64,"pct":0.058662,"example_message":"Expression expected. Provide a valid expression (variable, constant, calculation, or method call)."},{"code":"AL0198","count":36,"pct":0.032997,"example_message":"Expected one of the application object keywords (table, tableextension, page, pageextension, pagecustomization, profile, profileextension, codeunit, report, reportextension, xmlport, query, controladdin, dotnet, enum, enumextension, interface, permissionset, permissionsetextension, entitlement)"},{"code":"AL0620","count":36,"pct":0.032997,"example_message":"Preprocessor directives must appear as the first non-whitespace character on a line."},{"code":"AL0107","count":29,"pct":0.026581,"example_message":"Syntax error, identifier expected. Provide a valid name (letters, digits, and underscores only)."},{"code":"AL0183","count":24,"pct":0.021998,"example_message":"Unexpected character '`'. Remove the invalid character or check if a special character needs escaping."},{"code":"AL0105","count":23,"pct":0.021082,"example_message":"Syntax error, identifier expected; 'key' is a keyword"},{"code":"AL0114","count":16,"pct":0.014665,"example_message":"Syntax error, integer literal expected. Provide a numeric value (e.g., 0, 1, 42)."}],"recent_runs":[{"run_id":"b9ca725e-7be3-4b1b-9a7e-5940440ad41b","ts":"2026-05-04T23:37:17.408Z","score":64.185393,"cost_usd":2.35494,"tier":"claimed"},{"run_id":"6892ef4f-9566-4fed-aaae-641b5829730e","ts":"2026-05-04T20:18:33.860Z","score":64.444444,"cost_usd":2.361459,"tier":"claimed"},{"run_id":"75466b2c-00f2-4ba5-b7f9-e48607416da8","ts":"2026-05-04T16:43:38.341Z","score":66.292135,"cost_usd":2.27922,"tier":"claimed"}]}