From ee5d72301ae31ceb435ae984618f8ce0cf8069cc Mon Sep 17 00:00:00 2001 From: Paul Gauthier Date: Fri, 24 Jan 2025 08:47:25 -0800 Subject: [PATCH] copy --- aider/models.py | 2 +- aider/website/_data/r1_architect.yml | 10 +++--- aider/website/_posts/2025-01-24-r1-sonnet.md | 34 ++++++++++++++++++++ 3 files changed, 40 insertions(+), 6 deletions(-) diff --git a/aider/models.py b/aider/models.py index 6e91d6aab..97575993b 100644 --- a/aider/models.py +++ b/aider/models.py @@ -841,7 +841,7 @@ MODEL_SETTINGS = [ use_repo_map=True, streaming=False, use_temperature=False, - extra_params=dict(extra_body=dict(reasoning_effort="high")), + # extra_params=dict(extra_body=dict(reasoning_effort="high")), ), ModelSettings( "openrouter/qwen/qwen-2.5-coder-32b-instruct", diff --git a/aider/website/_data/r1_architect.yml b/aider/website/_data/r1_architect.yml index c036c7de8..5467e0fc7 100644 --- a/aider/website/_data/r1_architect.yml +++ b/aider/website/_data/r1_architect.yml @@ -23,7 +23,7 @@ exhausted_context_windows: 0 test_timeouts: 5 total_tests: 225 - command: aider --model deepseek/deepseek-reasoner + command: aider --architect --model r1 --editor-model sonnet date: 2025-01-23 versions: 0.72.3.dev seconds_per_case: 251.6 @@ -49,7 +49,7 @@ exhausted_context_windows: 1 test_timeouts: 5 total_tests: 225 - command: aider --model deepseek/deepseek-reasoner + command: aider --model r1 date: 2025-01-20 versions: 0.71.2.dev seconds_per_case: 113.7 @@ -76,7 +76,7 @@ exhausted_context_windows: 0 test_timeouts: 2 total_tests: 225 - command: aider --model openrouter/openai/o1 + command: aider --model o1 date: 2024-12-21 versions: 0.69.2.dev seconds_per_case: 133.2 @@ -103,7 +103,7 @@ exhausted_context_windows: 0 test_timeouts: 8 total_tests: 225 - command: aider --model deepseek/deepseek-chat + command: aider --model deepseek date: 2024-12-25 versions: 0.69.2.dev seconds_per_case: 34.8 @@ -131,7 +131,7 @@ exhausted_context_windows: 1 test_timeouts: 8 total_tests: 225 - command: aider --model claude-3-5-sonnet-20241022 + command: aider --model sonnet date: 2025-01-17 versions: 0.71.2.dev seconds_per_case: 21.4 diff --git a/aider/website/_posts/2025-01-24-r1-sonnet.md b/aider/website/_posts/2025-01-24-r1-sonnet.md index ac74ee7b5..c7d737e76 100644 --- a/aider/website/_posts/2025-01-24-r1-sonnet.md +++ b/aider/website/_posts/2025-01-24-r1-sonnet.md @@ -29,6 +29,40 @@ This is in contrast to the first wave of thinking models like o1-preview and o1- which improved when paired with many different editor models. +## Try it + +Once you [install aider](https://aider.chat/docs/install.html), +you can use aider, R1 and Sonnet like this: + +```bash +export DEEPSEEK_API_KEY= +export ANTHROPIC_API_KEY= + +aider --architect --model r1 --editor-model sonnet +``` + +Or if you have an [OpenRouter](https://openrouter.ai) account: + +```bash +export OPENROUTER_API_KEY= + +aider --architect --model openrouter/deepseek/deepseek-r1 --editor-model openrouter/anthropic/claude-3.5-sonnet +``` + +## Thinking output + +There has been +[some recent discussion](https://github.com/Aider-AI/aider/pull/2973) +about extracting the `` tokens from R1's responses +and feeding them to Sonnet. +That was an interesting experiment, for sure. + +To be clear, the results above are *not* using R1's thinking tokens, just the normal +final output. +R1 is configured in aider's standard architect role with Sonnet as editor. +The benchmark results that used the thinking tokens appear to be worse than +the architect/editor results shared here. + ## Results