feat: Create PatchCoder for applying patch-formatted code edits

2025-06-01 02:05:00 +00:00 · 2025-04-14 14:36:24 -07:00 · 2025-04-14 14:36:24 -07:00 · 8cc8027b40
commit 8cc8027b40
parent ffb743e108
1 changed files with 282 additions and 0 deletions
--- a/aider/coders/patch_coder.py
+++ b/aider/coders/patch_coder.py
@ -0,0 +1,282 @@
 import pathlib
 import re
 from dataclasses import dataclass, field
 from enum import Enum
 from typing import Dict, List, Optional, Tuple
 from ..dump import dump  # noqa: F401
 from .base_coder import Coder
 # Adapted structures and types from apply_patch.py for parsing and applying
 class ActionType(str, Enum):
    """
    Kind of file-level operation requested by one patch action.

    Each member's value is the exact word used in the corresponding patch
    header line (``*** Add File:``, ``*** Delete File:``,
    ``*** Update File:``), so a header word can be converted directly with
    ``ActionType(word)``.
    """
    ADD = "Add"
    DELETE = "Delete"
    UPDATE = "Update"
@dataclass
 class Chunk:
    """One group of deleted and inserted lines belonging to an Update action."""
    # Position of the chunk in the original file's lines; the default of -1
    # means "not set".
    # NOTE(review): whether this index is absolute or relative to a context
    # block is not settled in this file -- confirm before relying on it.
    orig_index: int = -1
    # Lines to remove, taken from '-' patch lines with the marker removed.
    del_lines: List[str] = field(default_factory=list)
    # Lines to insert, taken from '+' patch lines with the marker removed.
    ins_lines: List[str] = field(default_factory=list)
    context_before: List[str] = field(default_factory=list) # Store context for validation/application
@dataclass
 class PatchAction:
    """A single file operation (Add, Delete or Update) parsed from a patch."""
    # Which operation to perform on `path`.
    type: ActionType
    # File path as written in the patch header line, whitespace-stripped.
    path: str
    # Full text of the new file, built from the '+' lines of an Add section
    # (each line terminated by "\n"). None when nothing followed the header.
    new_content: Optional[str] = None # For Add
    # Line-level changes to apply to an existing file.
    chunks: List[Chunk] = field(default_factory=list) # For Update
    # Destination path taken from an optional "*** Move to:" line.
    move_path: Optional[str] = None # For Update
 class PatchCoder(Coder):
    """
    A coder that uses a custom patch format for code modifications,
    inspired by the format described in tmp.gpt41edits.txt.

    The LLM response is expected to contain a block delimited by
    ``*** Begin Patch`` / ``*** End Patch`` holding ``*** Add File:``,
    ``*** Delete File:`` and ``*** Update File:`` sections. The response is
    parsed into PatchAction objects, which are then applied to files.
    Applying Update actions that contain chunks is not implemented yet.
    """
    # Name identifying this coder's edit format.
    # NOTE(review): presumably used by the Coder base class to select this
    # coder -- confirm against base_coder.
    edit_format = "patch"
    gpt_prompts = None  # Prompts to be added later
    def get_edits(self) -> List[PatchAction]:
        """
        Parse the LLM response (containing the patch) into PatchAction objects.

        Reads ``self.partial_response_content``. An empty or whitespace-only
        response yields an empty list without invoking the parser.

        Returns:
            The actions found in the patch, in the order they appear.

        Raises:
            ValueError: If the parser raises. The original exception is
                attached as ``__cause__``.
        """
        content = self.partial_response_content
        if not content or not content.strip():
            return []
        try:
            return self._parse_patch_content(content)
        except Exception as e:
            # Chain explicitly so the traceback reports the parser failure as
            # the direct cause instead of as an incidental "during handling".
            raise ValueError(f"Error parsing patch content: {e}") from e
    def _parse_patch_content(self, content: str) -> List[PatchAction]:
        """
        Parse patch text into a list of PatchAction objects.

        Only the text between ``*** Begin Patch`` and the first
        ``*** End Patch`` is examined; anything before or after is ignored.
        A missing ``*** End Patch`` is tolerated and the last action is still
        returned. Inside the patch, every
        ``*** Add File:`` / ``*** Delete File:`` / ``*** Update File:`` line
        starts a new action:

        * Add -- each following line that starts with ``+`` contributes one
          line to ``new_content``; other lines are ignored.
        * Delete -- following lines are ignored.
        * Update -- an optional ``*** Move to: <path>`` directly after the
          header sets ``move_path``. Each run of consecutive ``-``/``+``
          lines becomes one Chunk. Plain lines seen before a run are stored
          in that chunk's ``context_before`` (with a single leading space
          marker removed, if present). ``@@`` lines and ``*** End of File``
          end the current run and are not stored; ``@@`` additionally
          discards context collected so far, since it opens a new section.

        This remains a simplified parser: it does not compute
        ``Chunk.orig_index`` and does not validate anything against the
        current file content.

        Args:
            content: Raw response text that may contain a patch.

        Returns:
            The parsed actions in the order they appear in the patch.
        """
        # Compile once instead of re-resolving the patterns for every line.
        action_re = re.compile(r"\*\*\* (Update|Add|Delete) File: (.*)")
        move_re = re.compile(r"\*\*\* Move to: (.*)")

        edits: List[PatchAction] = []
        lines = content.splitlines()
        current_action: Optional[PatchAction] = None
        in_patch = False
        # Context lines collected since the last change run of the current Update.
        pending_context: List[str] = []
        # True while consecutive '-'/'+' lines keep extending the newest chunk.
        in_change_run = False

        i = 0
        while i < len(lines):
            line = lines[i]
            i += 1
            stripped = line.strip()

            if stripped == "*** Begin Patch":
                in_patch = True
                continue
            if not in_patch:
                continue
            if stripped == "*** End Patch":
                break  # Only the first patch block is parsed

            match = action_re.match(line)
            if match:
                if current_action is not None:
                    edits.append(current_action)  # Save previous action
                action_type = ActionType(match.group(1))
                current_action = PatchAction(type=action_type, path=match.group(2).strip())
                pending_context = []
                in_change_run = False
                # Optional "Move to" line is only recognised directly after Update
                if action_type == ActionType.UPDATE and i < len(lines):
                    move_match = move_re.match(lines[i])
                    if move_match:
                        current_action.move_path = move_match.group(1).strip()
                        i += 1  # Consume the move line
                continue

            if current_action is None:
                # Skip lines before the first action inside the patch
                continue

            if current_action.type == ActionType.ADD:
                # new_content switches from None to "" as soon as any line
                # follows the header, so apply_edits can tell "no body at all"
                # apart from "body without '+' lines".
                if current_action.new_content is None:
                    current_action.new_content = ""
                if line.startswith("+"):
                    current_action.new_content += line[1:] + "\n"
                continue

            if current_action.type != ActionType.UPDATE:
                continue  # Delete sections carry no body

            if line.startswith(("-", "+")):
                if not in_change_run:
                    # A change line after context/markers opens a new chunk, so
                    # separate hunks are no longer merged into one.
                    current_action.chunks.append(Chunk(context_before=pending_context))
                    pending_context = []
                    in_change_run = True
                chunk = current_action.chunks[-1]
                if line[0] == "-":
                    chunk.del_lines.append(line[1:])
                else:
                    chunk.ins_lines.append(line[1:])
                continue

            # Anything else terminates the current run of change lines.
            in_change_run = False
            if line.startswith("@@"):
                # Section marker: earlier context belongs to the previous section.
                pending_context = []
                continue
            if stripped == "*** End of File":
                continue
            # Plain context line; drop the single-space marker when present.
            pending_context.append(line[1:] if line.startswith(" ") else line)

        # Covers both a normal "*** End Patch" and a patch cut off before it.
        if current_action is not None:
            edits.append(current_action)
        return edits
    def apply_edits(self, edits: List[PatchAction]):
        """
        Apply the parsed PatchActions to the corresponding files, in order.

        * Add -- creates the file (and missing parent directories) with
          ``new_content`` normalised to end in exactly one newline. Fails if
          the file already exists or the action has no content.
        * Delete -- removes the file if it exists; a missing file is not an
          error.
        * Update -- reads the file, builds the new text with
          ``_apply_update`` and writes it to ``move_path`` when given,
          otherwise back to the same path. When moved to a different path,
          the original file is removed after the write.

        Args:
            edits: Actions to apply. A falsy value (empty list or None) is a
                no-op.

        Raises:
            ValueError: If any action fails. The underlying exception is
                attached as ``__cause__``. Actions applied before the failing
                one are not rolled back.
        """
        if not edits:
            return
        for action in edits:
            full_path = self.abs_root_path(action.path)
            path_obj = pathlib.Path(full_path)
            try:
                if action.type == ActionType.ADD:
                    if path_obj.exists():
                        # According to apply_patch.py, Add should fail if file exists.
                        raise ValueError(f"ADD Error: File already exists: {action.path}")
                    if action.new_content is None:
                        raise ValueError(f"ADD change for {action.path} has no content")
                    path_obj.parent.mkdir(parents=True, exist_ok=True)
                    # Ensure single trailing newline
                    self.io.write_text(full_path, action.new_content.rstrip("\n") + "\n")
                elif action.type == ActionType.DELETE:
                    # Deleting a non-existent file is allowed (idempotent)
                    if path_obj.exists():
                        path_obj.unlink()
                elif action.type == ActionType.UPDATE:
                    if not path_obj.exists():
                        raise ValueError(f"UPDATE Error: File does not exist: {action.path}")
                    current_content = self.io.read_text(full_path)
                    if current_content is None:
                        raise ValueError(f"Could not read file for UPDATE: {action.path}")
                    new_content = self._apply_update(current_content, action.chunks, action.path)
                    if action.move_path:
                        target_full_path = self.abs_root_path(action.move_path)
                    else:
                        target_full_path = full_path
                    pathlib.Path(target_full_path).parent.mkdir(parents=True, exist_ok=True)
                    self.io.write_text(target_full_path, new_content)
                    if action.move_path and full_path != target_full_path:
                        # Remove original only after the new location was written
                        path_obj.unlink()
                else:
                    raise ValueError(f"Unknown action type encountered: {action.type}")
            except Exception as e:
                # Raise a ValueError to signal failure, consistent with other
                # coders; chain the cause so the root error stays in the traceback.
                raise ValueError(
                    f"Error applying action '{action.type}' to {action.path}: {e}"
                ) from e
    def _apply_update(self, text: str, chunks: List[Chunk], path: str) -> str:
        """
        Apply UPDATE chunks to the given text content.

        Chunk application is not implemented yet: doing it correctly needs
        chunk positions that were located and validated against the file's
        context, which the simplified parser does not provide. Only the
        trivial "no chunks" case is supported.

        Args:
            text: Current content of the file being updated.
            chunks: Changes to apply.
            path: Path of the file being updated; not used yet.

        Returns:
            ``text`` unchanged when ``chunks`` is empty.

        Raises:
            NotImplementedError: Whenever at least one chunk is supplied.
        """
        if not chunks:
            return text  # No changes specified
        # TODO: implement once chunks carry validated positions. The applier
        # should copy untouched lines up to each chunk, check that the lines
        # to delete match the file, emit the inserted lines, reject
        # overlapping or out-of-order chunks, and finally copy the remainder.
        raise NotImplementedError(
            "_apply_update requires a robust parser and context handling, similar to apply_patch.py"
        )