diff --git a/benchmark/swe_bench_lite.py b/benchmark/swe_bench_lite.py index b719a6ab8..023f50d5f 100644 --- a/benchmark/swe_bench_lite.py +++ b/benchmark/swe_bench_lite.py @@ -1,8 +1,10 @@ +import sys +from pathlib import Path + import matplotlib.pyplot as plt from imgcat import imgcat from matplotlib import rc -import sys -from pathlib import Path + def plot_swe_bench_lite(data_file): with open(data_file, "r") as file: @@ -32,7 +34,7 @@ def plot_swe_bench_lite(data_file): rc("font", **font_params) plt.rcParams["text.color"] = font_color - fig, ax = plt.subplots(figsize=(10, 5)) + fig, ax = plt.subplots(figsize=(10, 6)) ax.grid(axis="y", zorder=0, lw=0.2) for spine in ax.spines.values(): spine.set_edgecolor("#DDDDDD") @@ -43,7 +45,7 @@ def plot_swe_bench_lite(data_file): for model, pass_rate, color in zip(models, pass_rates, colors): alpha = 0.9 if "Aider" in model else 0.3 hatch = "" - #if "lite" not in data_file: + # if "lite" not in data_file: # hatch = "///" if "(570)" in model else "" bar = ax.bar(model, pass_rate, color=color, alpha=alpha, zorder=3, hatch=hatch) bars.append(bar[0]) @@ -78,19 +80,21 @@ def plot_swe_bench_lite(data_file): color=font_color, ) - # Add note at the bottom of the graph - note = "Note: (570) and (2294) refer to the number of instances that were processed by the agent." + note = ( + "Note: (570) and (2294) refer to the number of SWE Bench instances that were benchmarked." + ) plt.figtext( - 0.5, 0.025, + 0.5, + 0.025, note, wrap=True, - horizontalalignment='center', + horizontalalignment="center", fontsize=12, color=font_color, ) - plt.tight_layout(pad=5.0) + plt.tight_layout(pad=3.0) out_fname = Path(data_file) plt.savefig(out_fname.with_suffix(".jpg").name)