chore: Update polyglot leaderboard entry with new test results

This commit is contained in:
Paul Gauthier 2025-03-14 18:19:20 -07:00 committed by Paul Gauthier (aider)
parent a1aa63fa06
commit fd21f5195d

View file

@ -729,28 +729,28 @@
seconds_per_case: 137.4
total_cost: 0
- dirname: 2025-03-13-20-46-30--cmda-whole
- dirname: 2025-03-14-23-40-00--cmda-quality-whole2
test_cases: 225
model: command-a-03-2025
model: command-a-03-2025-quality
edit_format: whole
commit_hash: 024b913-dirty
commit_hash: a1aa63f
pass_rate_1: 2.2
pass_rate_2: 4.9
pass_rate_2: 12.0
pass_num_1: 5
pass_num_2: 11
percent_cases_well_formed: 100.0
error_outputs: 38
num_malformed_responses: 0
num_with_malformed_responses: 0
user_asks: 231
pass_num_2: 27
percent_cases_well_formed: 99.6
error_outputs: 2
num_malformed_responses: 1
num_with_malformed_responses: 1
user_asks: 215
lazy_comments: 0
syntax_errors: 0
indentation_errors: 0
exhausted_context_windows: 0
test_timeouts: 2
exhausted_context_windows: 1
test_timeouts: 4
total_tests: 225
command: aider --model cohere_chat/command-a-03-2025
date: 2025-03-13
versions: 0.76.3.dev
seconds_per_case: 106.3
command: OPENAI_API_BASE=https://api.cohere.ai/compatibility/v1 aider --model openai/command-a-03-2025-quality
date: 2025-03-14
versions: 0.77.1.dev
seconds_per_case: 85.1
total_cost: 0.0000