diff --git a/benchmark/benchmark.py b/benchmark/benchmark.py
index 4076769de..e6cf5a9d2 100755
--- a/benchmark/benchmark.py
+++ b/benchmark/benchmark.py
@@ -24,8 +24,8 @@ from dotenv import load_dotenv
 from plots import plot_refactoring
 from rich.console import Console
 
-from aider import models
-from aider.coders import Coder
+from aider import models, sendchat
+from aider.coders import Coder, base_coder
 from aider.dump import dump  # noqa: F401
 from aider.io import InputOutput
 
@@ -270,6 +270,11 @@ def main(
     if num_tests > 0:
         test_dnames = test_dnames[:num_tests]
 
+    # Don't give up when benchmarking
+    LONG_TIMEOUT = 24 * 60 * 60
+    sendchat.RETRY_TIMEOUT = LONG_TIMEOUT
+    base_coder.RETRY_TIMEOUT = LONG_TIMEOUT
+
     if threads == 1:
         all_results = []
         for testname in test_dnames: