From 2269f56aed15cd456c5e99a87ce4b330418f307c Mon Sep 17 00:00:00 2001 From: Paul Gauthier Date: Wed, 8 May 2024 15:38:41 -0700 Subject: [PATCH] updated gpt-0125 refac --- _data/refactor_leaderboard.yml | 28 ++++++++++++++-------------- 1 file changed, 14 insertions(+), 14 deletions(-) diff --git a/_data/refactor_leaderboard.yml b/_data/refactor_leaderboard.yml index 23e42d64b..7af3a87ac 100644 --- a/_data/refactor_leaderboard.yml +++ b/_data/refactor_leaderboard.yml @@ -59,27 +59,27 @@ seconds_per_case: 42.4 total_cost: 19.6556 -- dirname: 2024-01-25-22-07-21--jan-gpt-4-0125-preview-udiff +- dirname: 2024-05-08-22-25-41--may-refac-gpt-4-0125-preview-ex-sys test_cases: 89 model: gpt-4-0125-preview edit_format: udiff - commit_hash: 0fbd702 - pass_rate_1: 43.8 - percent_cases_well_formed: 74.2 - error_outputs: 51 - num_malformed_responses: 23 + commit_hash: bf09bd3-dirty + pass_rate_1: 33.7 + percent_cases_well_formed: 47.2 + error_outputs: 142 + num_malformed_responses: 47 user_asks: 0 lazy_comments: 1 - syntax_errors: 4 - indentation_errors: 11 - exhausted_context_windows: 1 + syntax_errors: 2 + indentation_errors: 16 + exhausted_context_windows: 0 test_timeouts: 0 command: aider --model gpt-4-0125-preview - date: 2024-01-25 - versions: 0.22.1-dev - seconds_per_case: 70.4 - total_cost: 43.3437 - + date: 2024-05-08 + versions: 0.33.1-dev + seconds_per_case: 56.6 + total_cost: 20.3270 + - dirname: 2024-05-08-21-24-16--may-refac-gpt-4-1106-preview test_cases: 89 model: gpt-4-1106-preview