{"model":{"slug":"anthropic/claude-haiku-4-5-20251001","display_name":"Claude Haiku 4 5 20251001","api_model_id":"claude-haiku-4-5-20251001","family_slug":"claude","added_at":"2026-05-05T08:29:04.135Z","settings_suffix":""},"aggregates":{"avg_score":44.370861,"tasks_attempted":302,"tasks_passed":109,"tasks_attempted_distinct":64,"tasks_passed_attempt_1":28,"tasks_passed_attempt_2_only":10,"pass_at_n":0.59375,"avg_cost_usd":0.000024,"latency_p50_ms":41681,"latency_p95_ms":150913,"pass_rate_ci":{"lower":0.471449865045497,"upper":0.7054327556474111},"pass_hat_at_n":0.53125,"cost_per_pass_usd":0.000041,"run_count":3,"verified_runs":0},"settings":{"temperature":null,"thinking_budget":null,"tokens_avg_per_run":175927,"consistency_pct":92.19},"history":[{"run_id":"4438b0ca-feb4-4509-b231-3d768333cae3","ts":"2026-05-05T13:59:43.150Z","score":44.125,"cost_usd":0.00057,"tier":"claimed"},{"run_id":"eaf4e885-3a23-49ef-9c33-2023e972c577","ts":"2026-05-05T11:14:16.474Z","score":43.688119,"cost_usd":0.000481,"tier":"claimed"},{"run_id":"81f8056f-69e4-4948-b39c-e71d887397fa","ts":"2026-05-05T08:29:04.135Z","score":45.29703,"cost_usd":0.000514,"tier":"claimed"}],"failure_modes":[{"code":"AL0104","count":348,"pct":0.284314,"example_message":"Syntax error, 'end' expected"},{"code":"AL0000","count":153,"pct":0.125,"example_message":"App generation failed"},{"code":"AL0185","count":142,"pct":0.116013,"example_message":"Interface 'INotificationChannel' is missing"},{"code":"AL0132","count":85,"pct":0.069444,"example_message":"'System' does not contain a definition for 'CreateSequentialGuid'"},{"code":"AL0111","count":79,"pct":0.064542,"example_message":"Semicolon expected. Add a semicolon (;) to terminate the statement."},{"code":"AL0107","count":75,"pct":0.061275,"example_message":"Syntax error, identifier expected. Provide a valid name (letters, digits, and underscores only)."},{"code":"AL0118","count":54,"pct":0.044118,"example_message":"The name 'StrToInt' does not exist in the current context."},{"code":"AL0198","count":41,"pct":0.033497,"example_message":"Expected one of the application object keywords (table, tableextension, page, pageextension, pagecustomization, profile, profileextension, codeunit, report, reportextension, xmlport, query, controladdin, dotnet, enum, enumextension, interface, permissionset, permissionsetextension, entitlement)"},{"code":"AL0360","count":36,"pct":0.029412,"example_message":"Text literal was not properly terminated. Use the character ' to terminate the literal."},{"code":"AL0519","count":26,"pct":0.021242,"example_message":"'Key' is not valid value in this context."}],"recent_runs":[{"run_id":"4438b0ca-feb4-4509-b231-3d768333cae3","ts":"2026-05-05T13:59:43.150Z","score":44.125,"cost_usd":0.00057,"tier":"claimed"},{"run_id":"eaf4e885-3a23-49ef-9c33-2023e972c577","ts":"2026-05-05T11:14:16.474Z","score":43.688119,"cost_usd":0.000481,"tier":"claimed"},{"run_id":"81f8056f-69e4-4948-b39c-e71d887397fa","ts":"2026-05-05T08:29:04.135Z","score":45.29703,"cost_usd":0.000514,"tier":"claimed"}]}