diff --git a/benchmark/over_time.py b/benchmark/over_time.py
index c74593499..1a374f962 100644
--- a/benchmark/over_time.py
+++ b/benchmark/over_time.py
@@ -26,7 +26,7 @@ def plot_over_time(yaml_file):
     fig, ax = plt.subplots(figsize=(10, 4))
     ax.grid(axis="y", zorder=0, lw=0.2)
     colors = ['red' if 'gpt-4' in model else 'green' if 'gpt-3.5' in model else 'blue' for model in models]
-    ax.scatter(dates, pass_rates, c=colors, alpha=0.5)
+    ax.scatter(dates, pass_rates, c=colors, alpha=0.5, s=100)
 
     for i, model in enumerate(models):
         ax.annotate(model, (dates[i], pass_rates[i]), fontsize=12, alpha=0.75,