added refac leaderboard

This commit is contained in:
Paul Gauthier 2024-05-04 11:05:32 -07:00
parent b02320b08f
commit e524dd9203
3 changed files with 92 additions and 9 deletions

View file

@ -0,0 +1,16 @@
model,second,first,format,command,version,commits,date
claude-3-opus-20240229,68.4,53.4,diff,aider --opus,0.30.1,f4b1797,5/2/24
claude-3-sonnet-20240229,54.9,43.6,whole,aider --sonnet,0.25.0,a5f8076,3/6/24
Command-R+,29.3,22.6,whole,aider --model command-r-plus,0.28.0,a06c927,4/20/24
Deepseek Coder,54.5,47,whole,aider --model openai/deepseek-coder,0.30.1,c07f793,4/29/24
gemini-1.5-pro-latest,57.1,45.9,diff-fenced,aider --model gemini/gemini-1.5-pro-latest,0.32.0,5d32dd7,5/3/24
gpt-3.5-turbo-0125,49.6,39.8,whole,aider -3,0.22.0,da14474,2/2/24
gpt-3.5-turbo-0301,57.9,50.4,whole,aider --model gpt-3.5-turbo-0301,0.16.4-dev,44388db-dirty,11/6/23
gpt-3.5-turbo-0613,50.4,38.3,whole,aider --model gpt-3.5-turbo-0613,0.16.4-dev,93aa497-dirty,11/7/23
gpt-3.5-turbo-1106,56.1,45.5,whole,aider --model gpt-3.5-turbo-1106,0.30.1,7b14d77,4/30/24
gpt-4-0125-preview,66.2,55.6,udiff,aider --model gpt-4-0125-preview,0.22.1-dev,edcf9b1,1/25/24
gpt-4-0314,66.2,50.4,diff,aider --model gpt-4-0314,0.31.2-dev,0d43468,5/4/24
gpt-4-0613,67.7,46.6,diff,aider -4,0.18.1,3aa17c4,12/16/23
gpt-4-1106-preview,63.2,57.1,udiff,aider,0.31.2-dev,1981105-dirty,5/4/24
gpt-4-turbo-2024-04-09,64.4,49.2,diff,aider --gpt-4-turbo,0.30.1,e610e5b,5/1/24
Llama3 70B,49.2,38.6,diff,aider --model groq/llama3-70b-8192,0.32.0,b5bb453,5/3/24
1 model second first format command version commits date
2 claude-3-opus-20240229 68.4 53.4 diff aider --opus 0.30.1 f4b1797 5/2/24
3 claude-3-sonnet-20240229 54.9 43.6 whole aider --sonnet 0.25.0 a5f8076 3/6/24
4 Command-R+ 29.3 22.6 whole aider --model command-r-plus 0.28.0 a06c927 4/20/24
5 Deepseek Coder 54.5 47 whole aider --model openai/deepseek-coder 0.30.1 c07f793 4/29/24
6 gemini-1.5-pro-latest 57.1 45.9 diff-fenced aider --model gemini/gemini-1.5-pro-latest 0.32.0 5d32dd7 5/3/24
7 gpt-3.5-turbo-0125 49.6 39.8 whole aider -3 0.22.0 da14474 2/2/24
8 gpt-3.5-turbo-0301 57.9 50.4 whole aider --model gpt-3.5-turbo-0301 0.16.4-dev 44388db-dirty 11/6/23
9 gpt-3.5-turbo-0613 50.4 38.3 whole aider --model gpt-3.5-turbo-0613 0.16.4-dev 93aa497-dirty 11/7/23
10 gpt-3.5-turbo-1106 56.1 45.5 whole aider --model gpt-3.5-turbo-1106 0.30.1 7b14d77 4/30/24
11 gpt-4-0125-preview 66.2 55.6 udiff aider --model gpt-4-0125-preview 0.22.1-dev edcf9b1 1/25/24
12 gpt-4-0314 66.2 50.4 diff aider --model gpt-4-0314 0.31.2-dev 0d43468 5/4/24
13 gpt-4-0613 67.7 46.6 diff aider -4 0.18.1 3aa17c4 12/16/23
14 gpt-4-1106-preview 63.2 57.1 udiff aider 0.31.2-dev 1981105-dirty 5/4/24
15 gpt-4-turbo-2024-04-09 64.4 49.2 diff aider --gpt-4-turbo 0.30.1 e610e5b 5/1/24
16 Llama3 70B 49.2 38.6 diff aider --model groq/llama3-70b-8192 0.32.0 b5bb453 5/3/24