#!/usr/bin/env python # This is a Python script that uses OpenAI's GPT-3 to modify code based on user requests. import os import sys import copy import random import json import re import readline import traceback import argparse from tqdm import tqdm from pathlib import Path from collections import defaultdict from pygments import highlight, lexers, formatters import os import openai from dump import dump import prompts history_file = '.coder.history' try: readline.read_history_file(history_file) except FileNotFoundError: pass formatter = formatters.TerminalFormatter() openai.api_key = os.getenv("OPENAI_API_KEY") def find_index(list1, list2): for i in range(len(list1)): if list1[i:i+len(list2)] == list2: return i return -1 class Coder: fnames = dict() last_modified = 0 def __init__(self, use_gpt_4): if use_gpt_4: self.main_model = 'gpt-4' else: self.main_model = 'gpt-3.5-turbo' def add_file(self, fname): self.fnames[fname] = Path(fname).stat().st_mtime def files_modified(self): for fname,mtime in self.fnames.items(): if Path(fname).stat().st_mtime != mtime: return True def request(self, prompt): self.request_prompt = prompt def quoted_file(self, fname): prompt = '\n' prompt += fname prompt += '\n```\n' prompt += Path(fname).read_text() prompt += '\n```\n' return prompt def get_files_content(self): prompt = '' for fname in self.fnames: prompt += self.quoted_file(fname) return prompt def get_input(self): print() print('='*60) inp = '' num_control_c = 0 while not inp.strip(): try: inp = input('> ') except EOFError: return except KeyboardInterrupt: num_control_c += 1 print() if num_control_c >= 2: return print('^C again to quit') print() readline.write_history_file(history_file) return inp def set_files_messages(self, did_edits = False): last_modified = max(Path(fname).stat().st_mtime for fname in self.fnames) if last_modified <= self.last_modified: return did_edits = (self.last_modified > 0) self.last_modified = last_modified print('Reloading files...') if did_edits: files_content = prompts.files_content_prefix_edited else: files_content = prompts.files_content_prefix_plain files_content += self.get_files_content() files_content += prompts.files_content_suffix self.files_messages = [ dict(role = 'user', content = files_content), dict(role = 'assistant', content = "Ok."), ] return True def run(self): self.done_messages = [] self.cur_messages = [] self.set_files_messages() while True: inp = self.get_input() if inp is None: return if self.set_files_messages(): # files changed, move cur messages back behind the files messages self.done_messages += self.cur_messages self.cur_messages = [] self.cur_messages += [ dict(role = 'user', content = inp), ] #self.show_messages(self.done_messages, "done") #self.show_messages(self.files_messages, "files") #self.show_messages(self.cur_messages, "cur") messages = [ dict(role = 'system', content = prompts.main_system), ] messages += self.done_messages messages += self.files_messages messages += self.cur_messages self.show_messages(messages, 'all') content = self.send(messages) self.cur_messages += [ dict(role = 'assistant', content = content), ] print() print() try: edited = self.update_files(content, inp) except Exception as err: print(err) print() traceback.print_exc() edited = None if not edited: continue self.set_files_messages(True) self.done_messages += self.cur_messages self.cur_messages = [] def show_messages(self, messages, title): print(title.upper(), '*' * 50) for msg in messages: print() print('-' * 50) role = msg['role'].upper() content = msg['content'].splitlines() for line in content: print(role, line) def send(self, messages, model=None, show_progress = 0): #self.show_messages(messages, "all") if not model: model = self.main_model completion = openai.ChatCompletion.create( model=model, messages=messages, temperature=0, stream = True, ) if show_progress: return self.show_send_progress(completion, show_progress) else: return self.show_send_output_plain(completion) def show_send_progress(self, completion, show_progress): resp = [] pbar = tqdm(total = show_progress) for chunk in completion: try: text = chunk.choices[0].delta.content resp.append(text) except AttributeError: continue pbar.update(len(text)) pbar.update(show_progress) pbar.close() resp = ''.join(resp) return resp def show_send_output_plain(self, completion): resp = '' in_diff = False diff_lines = [] partial_line = '' for chunk in completion: if chunk.choices[0].finish_reason not in (None, 'stop'): dump(chunk.choices[0].finish_reason) try: text = chunk.choices[0].delta.content resp += text except AttributeError: continue sys.stdout.write(text) sys.stdout.flush() # disabled if False and '```' in resp: return resp return resp def show_send_output_color(self, completion): resp = [] in_diff = False diff_lines = [] def print_lines(): if not diff_lines: return code = '\n'.join(diff_lines) lexer = lexers.guess_lexer(code) code = highlight(code, lexer, formatter) print(code, end='') partial_line = '' for chunk in completion: try: text = chunk.choices[0].delta.content resp.append(text) except AttributeError: continue lines = (partial_line + text) lines = lines.split('\n') partial_line = lines.pop() for line in lines: check = line.rstrip() if check == '>>>>>>> UPDATED': print_lines() in_diff = False diff_lines = [] if check == '=======': print_lines() diff_lines = [] print(line) elif in_diff: diff_lines.append(line) else: print(line) if line.strip() == '<<<<<<< ORIGINAL': in_diff = True diff_lines = [] print_lines() if partial_line: print(partial_line) return ''.join(resp) pattern = re.compile(r'(\S+)\s+(```)?<<<<<<< ORIGINAL\n(.*?\n?)=======\n(.*?\n?)>>>>>>> UPDATED', re.MULTILINE | re.DOTALL) def update_files(self, content, inp): edited = set() for match in self.pattern.finditer(content): path, _, original, updated = match.groups() edited.add(path) if self.do_replace(path, original, updated): continue edit = match.group() self.do_gpt_powered_replace(path, edit, inp) return edited def do_replace(self, fname, before_text, after_text): before_text = self.strip_quoted_wrapping(before_text, fname) after_text = self.strip_quoted_wrapping(after_text, fname) fname = Path(fname) # does it want to make a new file? if not fname.exists() and not before_text: print('Creating empty file:', fname) fname.touch() content = fname.read_text().splitlines() if not before_text and not content: # first populating an empty file new_content = after_text else: before_lines = [l.strip() for l in before_text.splitlines()] stripped_content = [l.strip() for l in content] where = find_index(stripped_content, before_lines) if where < 0: return new_content = content[:where] new_content += after_text.splitlines() new_content += content[where+len(before_lines):] new_content = '\n'.join(new_content) + '\n' fname.write_text(new_content) print('Applied edit to', fname) return True def do_gpt_powered_replace(self, fname, edit, request): model = 'gpt-3.5-turbo' print(f'Asking {model} to apply ambiguous edit to {fname}...') fname = Path(fname) content = fname.read_text() prompt = prompts.editor_user.format( request = request, edit = edit, fname = fname, content = content, ) messages = [ dict(role = 'system', content = prompts.editor_system), dict(role = 'user', content = prompt), ] res = self.send(messages, show_progress = len(content) + len(edit)/2, model=model) res = self.strip_quoted_wrapping(res, fname) fname.write_text(res) def strip_quoted_wrapping(self, res, fname=None): if not res: return res res = res.splitlines() if fname and res[0].strip().endswith(Path(fname).name): res = res[1:] if res[0].startswith('```') and res[-1].startswith('```'): res = res[1:-1] res = '\n'.join(res) if res and res[-1] != '\n': res += '\n' return res def main(): parser = argparse.ArgumentParser(description='Chat with GPT about code') parser.add_argument('files', metavar='FILE', nargs='+', help='a list of source code files') parser.add_argument('-3', '--gpt-3-5-turbo', action='store_true', help='Only use gpt-3.5-turbo, not gpt-4') args = parser.parse_args() use_gpt_4 = not args.gpt_3_5_turbo coder = Coder(use_gpt_4) fnames = args.files for fname in fnames: coder.add_file(fname) coder.run() if __name__ == '__main__': status = main() sys.exit(status)