Mirror of https://github.com/Aider-AI/aider.git, synced 2025-05-30 17:24:59 +00:00
fix: Add cache headers for prompts when using a model with cache control

This commit is contained in:
parent b7e325be36
commit b200bde319

1 changed file with 24 additions and 20 deletions
@@ -66,8 +66,8 @@ class ChatChunks:
         return (
             self.system
             + self.examples
-            + self.repo
             + self.readonly_files
+            + self.repo
             + self.done
             + self.chat_files
             + self.cur
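For context, ChatChunks builds the full prompt as named groups of messages and all_messages() concatenates them in order; moving self.repo after self.readonly_files presumably puts the more stable read-only file content ahead of the repo map, which helps a cached prompt prefix survive repo-map changes. A minimal sketch of the shape this hunk implies (field names come from the diff; the dataclass form and the sample message contents are assumptions):

    from dataclasses import dataclass, field
    from typing import Dict, List

    @dataclass
    class ChatChunks:  # stand-in sketch, not the class from the commit
        system: List[Dict] = field(default_factory=list)
        examples: List[Dict] = field(default_factory=list)
        readonly_files: List[Dict] = field(default_factory=list)
        repo: List[Dict] = field(default_factory=list)
        done: List[Dict] = field(default_factory=list)
        chat_files: List[Dict] = field(default_factory=list)
        cur: List[Dict] = field(default_factory=list)

        def all_messages(self):
            # New order: read-only files come before the repo map.
            return (
                self.system
                + self.examples
                + self.readonly_files
                + self.repo
                + self.done
                + self.chat_files
                + self.cur
            )

    chunks = ChatChunks(
        system=[{"role": "system", "content": "You are a coding assistant."}],
        cur=[{"role": "user", "content": "Add a docstring."}],
    )
    print(chunks.all_messages())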
@@ -130,6 +130,7 @@ class Coder:
     message_cost = 0.0
     message_tokens_sent = 0
     message_tokens_received = 0
+    add_cache_headers = False

     @classmethod
     def create(
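add_cache_headers is declared as a class-level default, so every Coder starts with caching disabled and an individual instance only flips it during __init__ (see the later hunk). A toy illustration of that Python pattern, unrelated to aider's actual classes:

    class Example:
        add_cache_headers = False  # class attribute: shared default for all instances

        def __init__(self, enable_cache):
            if enable_cache:
                # assignment creates an instance attribute that shadows the class default
                self.add_cache_headers = True

    print(Example(False).add_cache_headers)  # False -> falls through to the class default
    print(Example(True).add_cache_headers)   # True  -> instance attribute wins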
@@ -205,18 +206,22 @@ class Coder:
         # Model
         main_model = self.main_model
         weak_model = main_model.weak_model
-        prefix = "Model:"
-        output = f" {main_model.name}"
-        if main_model.cache_control and self.cache_prompts:
-            output += "⚡"
-        output += " with"
-        if main_model.info.get("supports_assistant_prefill"):
-            output += " ♾️"
-        output += f" {self.edit_format} edit format"
+
         if weak_model is not main_model:
-            prefix = "Models:"
-            output += f", weak model {weak_model.name}"
-        lines.append(prefix + output)
+            prefix = "Main model"
+        else:
+            prefix = "Model"
+
+        output = f"{prefix}: {main_model.name} with {self.edit_format} edit format"
+        if self.add_cache_headers:
+            output += ", prompt cache"
+        if main_model.info.get("supports_assistant_prefill"):
+            output += ", infinite output"
+        lines.append(output)
+
+        if weak_model is not main_model:
+            output = f"Weak model: {weak_model.name}"
+            lines.append(output)

         # Repo
         if self.repo:
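To make the new announcement format concrete, here is a self-contained recreation of the string-building above with invented model names and capability flags (the real method reads these from self.main_model, self.edit_format, and the add_cache_headers flag):

    def announce(main_name, weak_name, edit_format, add_cache_headers, supports_prefill):
        lines = []
        prefix = "Main model" if weak_name != main_name else "Model"

        output = f"{prefix}: {main_name} with {edit_format} edit format"
        if add_cache_headers:
            output += ", prompt cache"
        if supports_prefill:
            output += ", infinite output"
        lines.append(output)

        if weak_name != main_name:
            lines.append(f"Weak model: {weak_name}")
        return lines

    for line in announce("claude-3-5-sonnet", "claude-3-haiku", "diff", True, True):
        print(line)
    # Main model: claude-3-5-sonnet with diff edit format, prompt cache, infinite output
    # Weak model: claude-3-haiku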
@@ -293,7 +298,6 @@ class Coder:
         self.aider_commit_hashes = set()
         self.rejected_urls = set()
         self.abs_root_path_cache = {}
-        self.cache_prompts = cache_prompts

         if not fnames:
             fnames = []
@@ -347,6 +351,9 @@ class Coder:

         self.main_model = main_model

+        if cache_prompts and self.main_model.cache_control:
+            self.add_cache_headers = True
+
         self.show_diffs = show_diffs

         self.commands = commands or Commands(self.io, self)
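The flag is only enabled when both conditions hold: the caller asked for prompt caching (cache_prompts) and the model's metadata reports cache-control support. A minimal sketch of that gate, with a stand-in object in place of the real model:

    from types import SimpleNamespace

    def wants_cache_headers(cache_prompts, main_model):
        # Mirrors the gate above: both the user setting and the model capability
        # must be truthy before cache headers are added.
        return bool(cache_prompts and main_model.cache_control)

    caching_model = SimpleNamespace(cache_control=True)    # invented stand-in
    legacy_model = SimpleNamespace(cache_control=False)    # invented stand-in

    print(wants_cache_headers(True, caching_model))   # True  -> add_cache_headers = True
    print(wants_cache_headers(True, legacy_model))    # False
    print(wants_cache_headers(False, caching_model))  # False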
@@ -916,12 +923,8 @@ class Coder:
         if user_lang:
             platform_text += f"- Language: {user_lang}\n"

-        if self.cache_prompts:
-            dt = datetime.now().astimezone().strftime("%Y-%m-%d")
-            platform_text += f"- Current date: {dt}"
-        else:
-            dt = datetime.now().astimezone().strftime("%Y-%m-%dT%H:%M:%S%z")
-            platform_text += f"- Current date/time: {dt}"
+        dt = datetime.now().astimezone().strftime("%Y-%m-%d")
+        platform_text += f"- Current date: {dt}"

         prompt = prompt.format(
             fence=self.fence,
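Always emitting a date-only stamp (instead of a full timestamp when caching was off) keeps the rendered system prompt byte-identical for a whole day, so a cached prompt prefix can actually be reused. Comparing the two strftime formats:

    from datetime import datetime

    now = datetime.now().astimezone()

    # Format kept by this commit: stable for an entire day.
    print(now.strftime("%Y-%m-%d"))             # e.g. 2024-08-26

    # Format previously used when caching was off: changes every second,
    # which would invalidate any cached prefix containing it.
    print(now.strftime("%Y-%m-%dT%H:%M:%S%z"))  # e.g. 2024-08-26T14:03:07+0200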
@@ -1027,7 +1030,7 @@ class Coder:

     def format_messages(self):
         chunks = self.format_chat_chunks()
-        if self.cache_prompts and self.main_model.cache_control:
+        if self.add_cache_headers:
             chunks.add_cache_control_headers()

         msgs = chunks.all_messages()
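The body of chunks.add_cache_control_headers() is not part of this diff; only its trigger changes, from re-checking cache_prompts and the model capability to the precomputed self.add_cache_headers flag. For Anthropic-style prompt caching, marking a cache breakpoint on a message typically looks roughly like the sketch below; this is an assumption about the general mechanism, not code from this commit:

    def mark_cache_breakpoint(message):
        # Wrap plain string content in a content block and tag it so the provider
        # may cache everything up to and including this message (assumed format).
        content = message["content"]
        if isinstance(content, str):
            content = [{"type": "text", "text": content}]
        content[-1]["cache_control"] = {"type": "ephemeral"}
        message["content"] = content
        return message

    msg = {"role": "system", "content": "You are an expert software developer."}
    print(mark_cache_breakpoint(msg))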
@@ -1476,6 +1479,7 @@ class Coder:
         cost = 0

         if completion and hasattr(completion, "usage") and completion.usage is not None:
+            dump(completion.usage)
             prompt_tokens = completion.usage.prompt_tokens
             completion_tokens = completion.usage.completion_tokens
             cached_tokens = getattr(completion.usage, "prompt_cache_hit_tokens", 0) or getattr(
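The cached_tokens line (truncated at the edge of the hunk) uses getattr with a default of 0 so that usage objects from providers without a prompt_cache_hit_tokens counter do not raise. A stand-alone sketch of the same fallback pattern, where the second attribute name is a hypothetical stand-in rather than the one used in the commit:

    from types import SimpleNamespace

    def cached_token_count(usage):
        # First attribute name appears in the hunk above; the second is hypothetical.
        return getattr(usage, "prompt_cache_hit_tokens", 0) or getattr(
            usage, "other_provider_cached_tokens", 0
        )

    with_hits = SimpleNamespace(prompt_tokens=1200, completion_tokens=80,
                                prompt_cache_hit_tokens=900)
    without = SimpleNamespace(prompt_tokens=1200, completion_tokens=80)

    print(cached_token_count(with_hits))  # 900
    print(cached_token_count(without))    # 0 (missing attribute falls back to default)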