mirror of
https://github.com/Aider-AI/aider.git
synced 2025-05-20 12:24:59 +00:00
53 lines
1.1 KiB
Python
Executable file
53 lines
1.1 KiB
Python
Executable file
#!/usr/bin/env python
|
|
|
|
import subprocess
|
|
import sys
|
|
|
|
from aider.dump import dump # noqa: F401
|
|
|
|
|
|
def main():
    """Run the benchmark script once per model / edit-format combination.

    Every pairing of the models and edit formats listed below is visited
    in model-major order.  Two kinds of pairings are skipped (see the
    comments in the loop).  For each remaining pairing the command line is
    printed and then executed with ``--threads 10 --cont``, using
    ``rungrid-<model>-<edit_format>`` as the run directory name.

    Raises:
        subprocess.CalledProcessError: if a benchmark run exits with a
            non-zero status (``check=True``); later runs are not started.
    """
    models = (
        "gpt-3.5-turbo-0301",
        "gpt-3.5-turbo-0613",
        "gpt-3.5-turbo-16k-0613",
    )
    edit_formats = (
        "diff",
        "diff-func",
        "whole",
        "whole-func",
    )

    # This exact pairing is excluded: sublist reliably hangs the API?
    hanging_pair = ("gpt-3.5-turbo-16k-0613", "whole-func")

    grid = [(name, fmt) for name in models for fmt in edit_formats]

    for model_name, fmt in grid:
        uses_functions = "-func" in fmt

        # "-func" formats are never run against "-03" model snapshots.
        # NOTE(review): presumably those snapshots lack function-calling
        # support -- confirm.
        if uses_functions and "-03" in model_name:
            continue

        if (model_name, fmt) == hanging_pair:
            continue

        run_dir = "rungrid-" + model_name + "-" + fmt

        argv = ["./benchmark/benchmark.py", run_dir]
        argv += ["--model", model_name]
        argv += ["--edit-format", fmt]
        argv += ["--threads", "10"]
        argv.append("--cont")

        # Echo the command before running it.
        print(" ".join(argv))

        subprocess.run(argv, check=True)
|
|
|
|
|
|
if __name__ == "__main__":
    # main() has no return statement, so this passes None to sys.exit(),
    # which exits with status 0 once every run has completed.
    sys.exit(main())
|