From ae539fb1f584bef503dc975a7b4dd141f3cdc91b Mon Sep 17 00:00:00 2001 From: Paul Gauthier Date: Wed, 25 Jun 2025 15:30:36 -0700 Subject: [PATCH] copy --- aider/website/_data/polyglot_leaderboard.yml | 85 +++++++++++++------- 1 file changed, 58 insertions(+), 27 deletions(-) diff --git a/aider/website/_data/polyglot_leaderboard.yml b/aider/website/_data/polyglot_leaderboard.yml index 260570dc9..1801b4d92 100644 --- a/aider/website/_data/polyglot_leaderboard.yml +++ b/aider/website/_data/polyglot_leaderboard.yml @@ -1093,32 +1093,6 @@ seconds_per_case: 12.0 total_cost: 0.4281 -- dirname: 2025-04-16-21-20-55--o3-high-diff-temp0-exsys - test_cases: 225 - model: o3 (high) - edit_format: diff - commit_hash: 24805ff-dirty - pass_rate_1: 36.9 - pass_rate_2: 79.6 - pass_num_1: 83 - pass_num_2: 179 - percent_cases_well_formed: 95.1 - error_outputs: 11 - num_malformed_responses: 11 - num_with_malformed_responses: 11 - user_asks: 110 - lazy_comments: 0 - syntax_errors: 0 - indentation_errors: 0 - exhausted_context_windows: 0 - test_timeouts: 2 - total_tests: 225 - command: aider --model o3 - date: 2025-04-16 - versions: 0.82.1.dev - seconds_per_case: 113.8 - total_cost: 111.0325 - - dirname: 2025-04-16-22-01-58--o4-mini-high-diff-exsys test_cases: 225 model: o4-mini (high) @@ -1562,4 +1536,61 @@ date: 2025-06-06 versions: 0.84.1.dev seconds_per_case: 716.6 - total_cost: 4.8016 \ No newline at end of file + total_cost: 4.8016 + +- dirname: 2025-06-25-21-04-24--o3-price-reduction-high + test_cases: 225 + model: o3 (high) + edit_format: diff + commit_hash: c48fea6 + reasoning_effort: high + pass_rate_1: 40.0 + pass_rate_2: 81.3 + pass_num_1: 90 + pass_num_2: 183 + percent_cases_well_formed: 94.7 + error_outputs: 25 + num_malformed_responses: 23 + num_with_malformed_responses: 12 + user_asks: 116 + lazy_comments: 0 + syntax_errors: 0 + indentation_errors: 0 + exhausted_context_windows: 1 + prompt_tokens: 3148932 + completion_tokens: 2047615 + test_timeouts: 2 + total_tests: 225 + command: aider --model o3 --reasoning-effort high + date: 2025-06-25 + versions: 0.84.1.dev + seconds_per_case: 197.3 + total_cost: 21.2259 + +- dirname: 2025-06-25-20-30-16--o3-price-reduction + test_cases: 225 + model: o3 + edit_format: diff + commit_hash: c48fea6 + pass_rate_1: 40.9 + pass_rate_2: 76.9 + pass_num_1: 92 + pass_num_2: 173 + percent_cases_well_formed: 93.8 + error_outputs: 22 + num_malformed_responses: 22 + num_with_malformed_responses: 14 + user_asks: 108 + lazy_comments: 2 + syntax_errors: 0 + indentation_errors: 0 + exhausted_context_windows: 0 + prompt_tokens: 2893189 + completion_tokens: 1154767 + test_timeouts: 1 + total_tests: 225 + command: aider --model o3 + date: 2025-06-25 + versions: 0.84.1.dev + seconds_per_case: 101.7 + total_cost: 13.7517 \ No newline at end of file