Avoid stomping extra_params["max_tokens"] with 1 during cache warming, which causes a loop of 1-token infinite-output responses with prefill models #1842 #1841

2025-05-31 01:35:00 +00:00 · 2024-09-30 14:22:11 -07:00 · 2024-09-30 14:22:11 -07:00 · f2e1e17741
commit f2e1e17741
parent 8fb0362b47
1 changed files with 1 additions and 1 deletions
--- a/aider/coders/base_coder.py
+++ b/aider/coders/base_coder.py
@@ -1073,7 +1073,7 @@ class Coder:
                self.warming_pings_left -= 1
                self.next_cache_warm = time.time() + delay

-                kwargs = self.main_model.extra_params or dict()
+                kwargs = dict(self.main_model.extra_params) or dict()
                kwargs["max_tokens"] = 1

                try: