From fd21f5195dd88587068ad776111adc13f150999e Mon Sep 17 00:00:00 2001 From: Paul Gauthier Date: Fri, 14 Mar 2025 18:19:20 -0700 Subject: [PATCH] chore: Update polyglot leaderboard entry with new test results --- aider/website/_data/polyglot_leaderboard.yml | 32 ++++++++++---------- 1 file changed, 16 insertions(+), 16 deletions(-) diff --git a/aider/website/_data/polyglot_leaderboard.yml b/aider/website/_data/polyglot_leaderboard.yml index 486167a55..04b1b0676 100644 --- a/aider/website/_data/polyglot_leaderboard.yml +++ b/aider/website/_data/polyglot_leaderboard.yml @@ -729,28 +729,28 @@ seconds_per_case: 137.4 total_cost: 0 -- dirname: 2025-03-13-20-46-30--cmda-whole +- dirname: 2025-03-14-23-40-00--cmda-quality-whole2 test_cases: 225 - model: command-a-03-2025 + model: command-a-03-2025-quality edit_format: whole - commit_hash: 024b913-dirty + commit_hash: a1aa63f pass_rate_1: 2.2 - pass_rate_2: 4.9 + pass_rate_2: 12.0 pass_num_1: 5 - pass_num_2: 11 - percent_cases_well_formed: 100.0 - error_outputs: 38 - num_malformed_responses: 0 - num_with_malformed_responses: 0 - user_asks: 231 + pass_num_2: 27 + percent_cases_well_formed: 99.6 + error_outputs: 2 + num_malformed_responses: 1 + num_with_malformed_responses: 1 + user_asks: 215 lazy_comments: 0 syntax_errors: 0 indentation_errors: 0 - exhausted_context_windows: 0 - test_timeouts: 2 + exhausted_context_windows: 1 + test_timeouts: 4 total_tests: 225 - command: aider --model cohere_chat/command-a-03-2025 - date: 2025-03-13 - versions: 0.76.3.dev - seconds_per_case: 106.3 + command: OPENAI_API_BASE=https://api.cohere.ai/compatibility/v1 aider --model openai/command-a-03-2025-quality + date: 2025-03-14 + versions: 0.77.1.dev + seconds_per_case: 85.1 total_cost: 0.0000 \ No newline at end of file