{"model":{"slug":"openrouter/x-ai/grok-4.3","display_name":"xAI: Grok 4.3","api_model_id":"x-ai/grok-4.3","family_slug":"grok","added_at":"2026-04-30","settings_suffix":""},"aggregates":{"avg_score":59.131206,"tasks_attempted":282,"tasks_passed":133,"tasks_attempted_distinct":64,"tasks_passed_attempt_1":38,"tasks_passed_attempt_2_only":10,"pass_at_n":0.75,"avg_cost_usd":0.032601,"latency_p50_ms":161741,"latency_p95_ms":207741,"pass_rate_ci":{"lower":0.6318349082561628,"upper":0.8398520802582591},"pass_hat_at_n":0.609375,"cost_per_pass_usd":0.043468,"run_count":3,"verified_runs":0},"settings":{"temperature":null,"thinking_budget":null,"tokens_avg_per_run":313946,"consistency_pct":76.56},"history":[{"run_id":"8306da4a-2147-463d-ae9b-1e1b7aeb4fdd","ts":"2026-05-05T13:59:43.150Z","score":61.820652,"cost_usd":0.670221,"tier":"claimed"},{"run_id":"b2f4e3fd-6f2e-463f-856c-4ba33d7f3390","ts":"2026-05-05T11:14:16.474Z","score":56.958763,"cost_usd":0.736483,"tier":"claimed"},{"run_id":"fb3cc98e-b018-42f9-83bf-09044a40e810","ts":"2026-05-05T08:29:04.134Z","score":58.736559,"cost_usd":0.679742,"tier":"claimed"}],"failure_modes":[{"code":"AL0104","count":131,"pct":0.224315,"example_message":"Syntax error, '{' expected"},{"code":"AL0132","count":112,"pct":0.191781,"example_message":"'Record Customer' does not contain a definition for 'Preferred Contact Method'"},{"code":"AL0000","count":95,"pct":0.162671,"example_message":"App generation failed"},{"code":"AL0107","count":40,"pct":0.068493,"example_message":"Syntax error, identifier expected. Provide a valid name (letters, digits, and underscores only)."},{"code":"AL0111","count":30,"pct":0.05137,"example_message":"Semicolon expected. Add a semicolon (;) to terminate the statement."},{"code":"AL0198","count":30,"pct":0.05137,"example_message":"Expected one of the application object keywords (table, tableextension, page, pageextension, pagecustomization, profile, profileextension, codeunit, report, reportextension, xmlport, query, controladdin, dotnet, enum, enumextension, interface, permissionset, permissionsetextension, entitlement)"},{"code":"AL0360","count":24,"pct":0.041096,"example_message":"Text literal was not properly terminated. Use the character ' to terminate the literal."},{"code":"AL0175","count":18,"pct":0.030822,"example_message":"Operator '=' cannot be applied to operands of type 'Joker' and 'Integer'"},{"code":"AL0196","count":14,"pct":0.023973,"example_message":"The call is ambiguous between the method 'Add(Text, Boolean)' defined in Class 'JsonObject' by the extension '' and the method 'Add(Text, Char)' defined in Class 'JsonObject' by the extension ''."},{"code":"AL0519","count":14,"pct":0.023973,"example_message":"'Key' is not valid value in this context."}],"recent_runs":[{"run_id":"8306da4a-2147-463d-ae9b-1e1b7aeb4fdd","ts":"2026-05-05T13:59:43.150Z","score":61.820652,"cost_usd":0.670221,"tier":"claimed"},{"run_id":"b2f4e3fd-6f2e-463f-856c-4ba33d7f3390","ts":"2026-05-05T11:14:16.474Z","score":56.958763,"cost_usd":0.736483,"tier":"claimed"},{"run_id":"fb3cc98e-b018-42f9-83bf-09044a40e810","ts":"2026-05-05T08:29:04.134Z","score":58.736559,"cost_usd":0.679742,"tier":"claimed"}]}