aider/benchmark/rungrid.py
2023-07-01 06:21:50 -07:00

39 lines
813 B
Python
Executable file

#!/usr/bin/env python
import sys
from aider.dump import dump
from benchmark import main as benchmark_main
def main():
    """Run the benchmark over every model / edit-format combination.

    For each pair, a results directory name of the form
    ``/benchmarks/rungrid-<model>-<edit_format>`` is built, passed to
    ``dump`` and then handed to ``benchmark_main`` together with the model,
    the edit format, ``threads=10`` and ``cont=True``.

    There is no explicit return statement, so the function returns None.
    """
    model_names = (
        "gpt-3.5-turbo-0301",
        "gpt-3.5-turbo-0613",
        "gpt-3.5-turbo-16k-0613",
    )
    format_names = (
        "diff",
        "diff-func",
        "whole",
        "whole-func",
    )

    # Models vary slowest and edit formats fastest.
    grid = [(name, fmt) for name in model_names for fmt in format_names]

    for model_name, fmt in grid:
        # NOTE(review): the variable name `dirname` and the one-line
        # `dump(dirname)` call are kept as-is in case dump() derives its
        # output label from the call expression -- confirm in aider.dump.
        dirname = f"/benchmarks/rungrid-{model_name}-{fmt}"
        dump(dirname)

        run_options = {
            "dirnames": [dirname],
            "model": model_name,
            "edit_format": fmt,
            "threads": 10,
            "cont": True,
        }
        benchmark_main(**run_options)
if __name__ == "__main__":
    # Script entry point: whatever main() returns becomes the argument to
    # sys.exit, i.e. the process exit status.
    sys.exit(main())