diff --git a/benchmark/over_time.py b/benchmark/over_time.py index c74593499..1a374f962 100644 --- a/benchmark/over_time.py +++ b/benchmark/over_time.py @@ -26,7 +26,7 @@ def plot_over_time(yaml_file): fig, ax = plt.subplots(figsize=(10, 4)) ax.grid(axis="y", zorder=0, lw=0.2) colors = ['red' if 'gpt-4' in model else 'green' if 'gpt-3.5' in model else 'blue' for model in models] - ax.scatter(dates, pass_rates, c=colors, alpha=0.5) + ax.scatter(dates, pass_rates, c=colors, alpha=0.5, s=100) for i, model in enumerate(models): ax.annotate(model, (dates[i], pass_rates[i]), fontsize=12, alpha=0.75,