refactor: Simplify error handling and remove unused retry exceptions code

commit 816fd5e65c
parent 8d4175536f
Paul Gauthier, 2024-11-07 13:02:04 -08:00; committed by Paul Gauthier (aider)
3 changed files with 54 additions and 138 deletions

aider/coders/base_coder.py

@@ -19,6 +19,7 @@ from json.decoder import JSONDecodeError
 from pathlib import Path
 from typing import List
 
+from aider.exceptions import LiteLLMExceptions
 from aider import __version__, models, prompts, urls, utils
 from aider.analytics import Analytics
 from aider.commands import Commands
@@ -29,7 +30,7 @@ from aider.llm import litellm
 from aider.repo import ANY_GIT_ERROR, GitRepo
 from aider.repomap import RepoMap
 from aider.run_cmd import run_cmd
-from aider.sendchat import RETRY_TIMEOUT, retry_exceptions, send_completion
+from aider.sendchat import RETRY_TIMEOUT, send_completion
 from aider.utils import format_content, format_messages, format_tokens, is_image_file
 
 from ..dump import dump  # noqa: F401
@@ -789,34 +790,9 @@ class Coder:
             self.num_reflections += 1
             message = self.reflected_message
 
-    def check_and_open_urls(self, exc: Exception) -> List[str]:
-        import openai
-
+    def check_and_open_urls(self, exc, friendly_msg=None):
         """Check exception for URLs, offer to open in a browser, with user-friendly error msgs."""
         text = str(exc)
-        friendly_msg = None
-
-        if isinstance(exc, (openai.APITimeoutError, openai.APIConnectionError)):
-            friendly_msg = (
-                "There is a problem connecting to the API provider. Please try again later or check"
-                " your model settings."
-            )
-        elif isinstance(exc, openai.RateLimitError):
-            friendly_msg = (
-                "The API provider's rate limits have been exceeded. Check with your provider or"
-                " wait awhile and retry."
-            )
-        elif isinstance(exc, openai.InternalServerError):
-            friendly_msg = (
-                "The API provider seems to be down or overloaded. Please try again later."
-            )
-        elif isinstance(exc, openai.BadRequestError):
-            friendly_msg = "The API provider refused the request as invalid?"
-        elif isinstance(exc, openai.AuthenticationError):
-            friendly_msg = (
-                "The API provider refused your authentication. Please check that you are using a"
-                " valid API key."
-            )
 
         if friendly_msg:
             self.io.tool_warning(text)
@@ -1152,8 +1128,6 @@ class Coder:
         return chunks
 
     def send_message(self, inp):
-        import openai  # for error codes below
-
         self.cur_messages += [
             dict(role="user", content=inp),
         ]
@@ -1173,6 +1147,8 @@ class Coder:
         retry_delay = 0.125
 
+        litellm_ex = LiteLLMExceptions()
+
         self.usage_report = None
         exhausted = False
         interrupted = False
@@ -1181,30 +1157,37 @@ class Coder:
             try:
                 yield from self.send(messages, functions=self.functions)
                 break
-            except retry_exceptions() as err:
-                # Print the error and its base classes
-                # for cls in err.__class__.__mro__: dump(cls.__name__)
-                retry_delay *= 2
-                if retry_delay > RETRY_TIMEOUT:
+            except litellm_ex.exceptions_tuple() as err:
+                ex_info = litellm_ex.get_ex_info(err)
+
+                if ex_info.name == "ContextWindowExceededError":
+                    exhausted = True
+                    break
+
+                should_retry = ex_info.retry
+                if should_retry:
+                    retry_delay *= 2
+                    if retry_delay > RETRY_TIMEOUT:
+                        should_retry = False
+
+                if not should_retry:
                     self.mdstream = None
-                    self.check_and_open_urls(err)
+                    self.check_and_open_urls(err, ex_info.description)
                     break
+
                 err_msg = str(err)
-                self.io.tool_error(err_msg)
+                if ex_info.description:
+                    self.io.tool_output(err_msg)
+                    self.io.tool_error(ex_info.description)
+                else:
+                    self.io.tool_error(err_msg)
                 self.io.tool_output(f"Retrying in {retry_delay:.1f} seconds...")
                 time.sleep(retry_delay)
                 continue
             except KeyboardInterrupt:
                 interrupted = True
                 break
-            except litellm.ContextWindowExceededError:
-                # The input is overflowing the context window!
-                exhausted = True
-                break
-            except litellm.exceptions.BadRequestError as br_err:
-                self.io.tool_error(f"BadRequestError: {br_err}")
-                return
             except FinishReasonLength:
                 # We hit the output limit!
                 if not self.main_model.info.get("supports_assistant_prefill"):
@@ -1219,12 +1202,8 @@ class Coder:
                 messages.append(
                     dict(role="assistant", content=self.multi_response_content, prefix=True)
                 )
-            except (openai.APIError, openai.APIStatusError) as err:
-                # for cls in err.__class__.__mro__: dump(cls.__name__)
-                self.mdstream = None
-                self.check_and_open_urls(err)
-                break
             except Exception as err:
+                self.mdstream = None
                 lines = traceback.format_exception(type(err), err, err.__traceback__)
                 self.io.tool_warning("".join(lines))
                 self.io.tool_error(str(err))
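
The send_message loop above now delegates all retry policy to the exception table: ContextWindowExceededError is special-cased, ExInfo.retry gates the backoff, and ExInfo.description supplies the user-facing text. A minimal standalone sketch of the same backoff shape, where classify() is a hypothetical stand-in for litellm_ex.get_ex_info() (not aider's actual API):

    import time
    from dataclasses import dataclass

    RETRY_TIMEOUT = 60  # give up once the next doubled delay would exceed this

    @dataclass
    class ExInfo:
        name: str
        retry: bool
        description: str

    def classify(err):
        # Hypothetical stand-in for litellm_ex.get_ex_info(err).
        table = {TimeoutError: ExInfo("TimeoutError", True, "The request timed out.")}
        return table.get(type(err), ExInfo(None, None, None))

    def send_with_backoff(send_fn):
        retry_delay = 0.125  # doubles before each retry: 0.25, 0.5, 1.0, ...
        while True:
            try:
                return send_fn()
            except Exception as err:
                ex_info = classify(err)
                should_retry = ex_info.retry
                if should_retry:
                    retry_delay *= 2
                    if retry_delay > RETRY_TIMEOUT:
                        should_retry = False
                if not should_retry:
                    raise
                print(ex_info.description or str(err))
                print(f"Retrying in {retry_delay:.1f} seconds...")
                time.sleep(retry_delay)

Under these assumptions a TimeoutError is retried with 0.25 s, 0.5 s, 1.0 s, ... delays until the next delay would exceed RETRY_TIMEOUT, mirroring the loop in send_message.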

aider/exceptions.py

@@ -1,37 +1,6 @@
 from dataclasses import dataclass
 
-
-def retry_exceptions():
-    import httpx
-    import openai
-
-    return (
-        # httpx
-        httpx.ConnectError,
-        httpx.RemoteProtocolError,
-        httpx.ReadTimeout,
-        #
-        # litellm exceptions inherit from openai exceptions
-        # https://docs.litellm.ai/docs/exception_mapping
-        #
-        # openai.BadRequestError,
-        # litellm.ContextWindowExceededError,
-        # litellm.ContentPolicyViolationError,
-        #
-        # openai.AuthenticationError,
-        # openai.PermissionDeniedError,
-        # openai.NotFoundError,
-        #
-        openai.APITimeoutError,
-        openai.UnprocessableEntityError,
-        openai.RateLimitError,
-        openai.APIConnectionError,
-        # openai.APIError,
-        # openai.APIStatusError,
-        openai.InternalServerError,
-    )
-
 
 @dataclass
 class ExInfo:
     name: str
@@ -43,20 +12,20 @@ EXCEPTIONS = [
     ExInfo("APIConnectionError", True, None),
     ExInfo("APIError", True, None),
     ExInfo("APIResponseValidationError", True, None),
-    ExInfo("AuthenticationError", True, None),
+    ExInfo("AuthenticationError", False, "The API provider is not able to authenticate you. Check your API key."),
     ExInfo("AzureOpenAIError", True, None),
-    ExInfo("BadRequestError", True, None),
+    ExInfo("BadRequestError", False, None),
     ExInfo("BudgetExceededError", True, None),
-    ExInfo("ContentPolicyViolationError", True, None),
-    ExInfo("ContextWindowExceededError", True, None),
-    ExInfo("InternalServerError", True, None),
+    ExInfo("ContentPolicyViolationError", True, "The API provider has refused the request due to a safety policy about the content."),
+    ExInfo("ContextWindowExceededError", False, None),  # special case handled in base_coder
+    ExInfo("InternalServerError", True, "The API provider's servers are down or overloaded."),
     ExInfo("InvalidRequestError", True, None),
     ExInfo("JSONSchemaValidationError", True, None),
-    ExInfo("NotFoundError", True, None),
+    ExInfo("NotFoundError", False, None),
     ExInfo("OpenAIError", True, None),
-    ExInfo("RateLimitError", True, None),
+    ExInfo("RateLimitError", True, "The API provider has rate limited you. Try again later or check your quotas."),
     ExInfo("RouterRateLimitError", True, None),
-    ExInfo("ServiceUnavailableError", True, None),
+    ExInfo("ServiceUnavailableError", True, "The API provider's servers are down or overloaded."),
     ExInfo("UnprocessableEntityError", True, None),
     ExInfo("UnsupportedParamsError", True, None),
 ]
@@ -92,7 +61,7 @@ class LiteLLMExceptions:
     def get_ex_info(self, ex):
         """Return the ExInfo for a given exception instance"""
-        return self.exceptions.get(ex.__class__)
+        return self.exceptions.get(ex.__class__, ExInfo(None, None, None))
 
 
 litellm_ex = LiteLLMExceptions()
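
The diff shows only part of LiteLLMExceptions; exceptions_tuple() and the code that populates self.exceptions are unchanged and therefore elided. A self-contained sketch of the registry pattern the class implements, using a hypothetical ExceptionRegistry rather than aider's real loader (which resolves each ExInfo.name against the litellm package):

    from dataclasses import dataclass

    @dataclass
    class ExInfo:
        name: str
        retry: bool
        description: str

    class ExceptionRegistry:
        """Hypothetical stand-in for aider's LiteLLMExceptions."""

        def __init__(self, table):
            # Map each exception class to its retry/description metadata.
            self.exceptions = dict(table)

        def exceptions_tuple(self):
            # Usable directly in an except clause: except reg.exceptions_tuple() as err.
            return tuple(self.exceptions)

        def get_ex_info(self, ex):
            # Unknown classes fall back to an empty ExInfo, so callers can always
            # read .retry and .description without checking for None first.
            return self.exceptions.get(ex.__class__, ExInfo(None, None, None))

    reg = ExceptionRegistry({TimeoutError: ExInfo("TimeoutError", True, "Timed out.")})
    try:
        raise TimeoutError("slow provider")
    except reg.exceptions_tuple() as err:
        assert reg.get_ex_info(err).retry

The default value added to exceptions.get() matters because the except clause also catches subclasses whose exact class is not a key in the table; returning ExInfo(None, None, None) makes those behave as non-retryable errors with no description instead of raising an AttributeError on None.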

aider/sendchat.py

@@ -5,6 +5,7 @@ import time
 import backoff
 
 from aider.dump import dump  # noqa: F401
+from aider.exceptions import LiteLLMExceptions
 from aider.llm import litellm
 
 # from diskcache import Cache
@@ -17,52 +18,6 @@ CACHE = None
 RETRY_TIMEOUT = 60
 
 
-def retry_exceptions():
-    import httpx
-    import openai
-
-    return (
-        # httpx
-        httpx.ConnectError,
-        httpx.RemoteProtocolError,
-        httpx.ReadTimeout,
-        #
-        # litellm exceptions inherit from openai exceptions
-        # https://docs.litellm.ai/docs/exception_mapping
-        #
-        # openai.BadRequestError,
-        # litellm.ContextWindowExceededError,
-        # litellm.ContentPolicyViolationError,
-        #
-        # openai.AuthenticationError,
-        # openai.PermissionDeniedError,
-        # openai.NotFoundError,
-        #
-        openai.APITimeoutError,
-        openai.UnprocessableEntityError,
-        openai.RateLimitError,
-        openai.APIConnectionError,
-        # openai.APIError,
-        # openai.APIStatusError,
-        openai.InternalServerError,
-    )
-
-
-def lazy_litellm_retry_decorator(func):
-    def wrapper(*args, **kwargs):
-        decorated_func = backoff.on_exception(
-            backoff.expo,
-            retry_exceptions(),
-            max_time=RETRY_TIMEOUT,
-            on_backoff=lambda details: print(
-                f"{details.get('exception', 'Exception')}\nRetry in {details['wait']:.1f} seconds."
-            ),
-        )(func)
-        return decorated_func(*args, **kwargs)
-
-    return wrapper
-
-
 def send_completion(
     model_name,
     messages,
@@ -104,6 +59,8 @@ def send_completion(
 
 
 def simple_send_with_retries(model_name, messages, extra_params=None):
+    litellm_ex = LiteLLMExceptions()
+
     retry_delay = 0.125
     while True:
         try:
@@ -117,11 +74,22 @@ def simple_send_with_retries(model_name, messages, extra_params=None):
             _hash, response = send_completion(**kwargs)
             return response.choices[0].message.content
-        except retry_exceptions() as err:
+        except litellm_ex.exceptions_tuple() as err:
+            ex_info = litellm_ex.get_ex_info(err)
             print(str(err))
-            retry_delay *= 2
-            if retry_delay > RETRY_TIMEOUT:
+            if ex_info.description:
+                print(ex_info.description)
+
+            should_retry = ex_info.retry
+            if should_retry:
+                retry_delay *= 2
+                if retry_delay > RETRY_TIMEOUT:
+                    should_retry = False
+
+            if not should_retry:
                 break
             print(f"Retrying in {retry_delay:.1f} seconds...")
             time.sleep(retry_delay)
             continue
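
With retry_exceptions() and the backoff-based lazy_litellm_retry_decorator removed, simple_send_with_retries is this module's only retry path, and it now follows the same backoff policy as Coder.send_message (0.125 s doubling, capped by RETRY_TIMEOUT, gated by ExInfo.retry). A usage sketch; the model name and message content are illustrative, not taken from the diff:

    from aider.sendchat import simple_send_with_retries

    # Hypothetical invocation: retries transient provider errors per the
    # EXCEPTIONS table, then returns the assistant message text.
    messages = [dict(role="user", content="Say hello.")]
    reply = simple_send_with_retries("gpt-4o", messages)
    print(reply)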