mirror of
https://github.com/Aider-AI/aider.git
synced 2025-06-03 11:14:59 +00:00
Added gpt-4-turbo-2024-04-09 (diff) to the leaderboard
This commit is contained in:
parent
efc9e56b23
commit
6d2b9d6699
2 changed files with 46 additions and 1 deletions
|
@ -426,3 +426,25 @@
|
||||||
seconds_per_case: 6.0
|
seconds_per_case: 6.0
|
||||||
total_cost: 0.0000
|
total_cost: 0.0000
|
||||||
|
|
||||||
|
- dirname: 2024-04-12-22-18-20--gpt-4-turbo-2024-04-09-plain-diff
|
||||||
|
test_cases: 33
|
||||||
|
model: gpt-4-turbo-2024-04-09 (diff)
|
||||||
|
edit_format: diff
|
||||||
|
commit_hash: 9b2e697-dirty
|
||||||
|
pass_rate_1: 48.5
|
||||||
|
pass_rate_2: 57.6
|
||||||
|
percent_cases_well_formed: 100.0
|
||||||
|
error_outputs: 15
|
||||||
|
num_malformed_responses: 0
|
||||||
|
user_asks: 15
|
||||||
|
lazy_comments: 0
|
||||||
|
syntax_errors: 0
|
||||||
|
indentation_errors: 0
|
||||||
|
exhausted_context_windows: 0
|
||||||
|
test_timeouts: 0
|
||||||
|
command: aider --model gpt-4-turbo-2024-04-09
|
||||||
|
date: 2024-04-12
|
||||||
|
versions: 0.28.1-dev
|
||||||
|
seconds_per_case: 17.6
|
||||||
|
total_cost: 1.6205
|
||||||
|
|
|
@ -120,4 +120,27 @@
|
||||||
date: 2024-05-13
|
date: 2024-05-13
|
||||||
versions: 0.34.1-dev
|
versions: 0.34.1-dev
|
||||||
seconds_per_case: 27.8
|
seconds_per_case: 27.8
|
||||||
total_cost: 0.0000
|
total_cost: 0.0000
|
||||||
|
|
||||||
|
- dirname: 2024-04-10-13-26-18--refac-gpt-4-turbo-2024-04-09-diff
|
||||||
|
test_cases: 88
|
||||||
|
model: gpt-4-turbo-2024-04-09 (diff)
|
||||||
|
edit_format: diff
|
||||||
|
commit_hash: 7875418
|
||||||
|
pass_rate_1: 21.4
|
||||||
|
percent_cases_well_formed: 6.8
|
||||||
|
error_outputs: 247
|
||||||
|
num_malformed_responses: 82
|
||||||
|
user_asks: 1
|
||||||
|
lazy_comments: 2
|
||||||
|
syntax_errors: 3
|
||||||
|
indentation_errors: 8
|
||||||
|
exhausted_context_windows: 0
|
||||||
|
test_timeouts: 0
|
||||||
|
command: aider --model gpt-4-turbo-2024-04-09
|
||||||
|
date: 2024-04-10
|
||||||
|
versions: 0.28.1-dev
|
||||||
|
seconds_per_case: 67.8
|
||||||
|
total_cost: 20.4889
|
||||||
|
|
||||||
|
|
Loading…
Add table
Add a link
Reference in a new issue