diff --git a/assets/swe_bench_lite.jpg b/assets/swe_bench_lite.jpg index d7455765e..6d6d3e807 100644 Binary files a/assets/swe_bench_lite.jpg and b/assets/swe_bench_lite.jpg differ diff --git a/assets/swe_bench_lite.svg b/assets/swe_bench_lite.svg index 9affe1f65..419998794 100644 --- a/assets/swe_bench_lite.svg +++ b/assets/swe_bench_lite.svg @@ -6,7 +6,7 @@ - 2024-05-23T08:28:16.091496 + 2024-05-23T09:49:41.227630 image/svg+xml @@ -41,12 +41,12 @@ z - - + @@ -453,7 +453,7 @@ z - + @@ -479,7 +479,7 @@ z - + @@ -601,7 +601,7 @@ z - + @@ -674,7 +674,7 @@ z - + @@ -886,7 +886,7 @@ z - + @@ -1007,7 +1007,7 @@ z - + @@ -1043,16 +1043,16 @@ z +" clip-path="url(#p3efb973a07)" style="fill: none; stroke: #b0b0b0; stroke-width: 0.2; stroke-linecap: square"/> - - + @@ -1089,11 +1089,11 @@ z +" clip-path="url(#p3efb973a07)" style="fill: none; stroke: #b0b0b0; stroke-width: 0.2; stroke-linecap: square"/> - + @@ -1135,11 +1135,11 @@ z +" clip-path="url(#p3efb973a07)" style="fill: none; stroke: #b0b0b0; stroke-width: 0.2; stroke-linecap: square"/> - + @@ -1167,11 +1167,11 @@ z +" clip-path="url(#p3efb973a07)" style="fill: none; stroke: #b0b0b0; stroke-width: 0.2; stroke-linecap: square"/> - + @@ -1186,11 +1186,11 @@ L 690 161.676713 +" clip-path="url(#p3efb973a07)" style="fill: none; stroke: #b0b0b0; stroke-width: 0.2; stroke-linecap: square"/> - + @@ -1232,11 +1232,11 @@ z +" clip-path="url(#p3efb973a07)" style="fill: none; stroke: #b0b0b0; stroke-width: 0.2; stroke-linecap: square"/> - + @@ -1411,7 +1411,7 @@ L 163.368917 273.70025 L 163.368917 77.285649 L 96.917045 77.285649 z -" clip-path="url(#p009365f358)" style="fill: #b3e6a8; opacity: 0.75"/> +" clip-path="url(#p3efb973a07)" style="fill: #b3e6a8; opacity: 0.9"/> +" clip-path="url(#p3efb973a07)" style="fill: #b3e6a8; opacity: 0.9"/> +" clip-path="url(#p3efb973a07)" style="fill: #b3d1e6; opacity: 0.3"/> +" clip-path="url(#p3efb973a07)" style="fill: #b3d1e6; opacity: 0.3"/> +" clip-path="url(#p3efb973a07)" style="fill: #b3d1e6; opacity: 0.3"/> +" clip-path="url(#p3efb973a07)" style="fill: #b3d1e6; opacity: 0.3"/> +" clip-path="url(#p3efb973a07)" style="fill: #b3d1e6; opacity: 0.3"/> @@ -1745,7 +1745,7 @@ z - + diff --git a/benchmark/swe_bench_lite.py b/benchmark/swe_bench_lite.py index c940b4bba..b8949abfa 100644 --- a/benchmark/swe_bench_lite.py +++ b/benchmark/swe_bench_lite.py @@ -34,7 +34,7 @@ def plot_swe_bench_lite(data_file): colors = ["#b3e6a8" if "Aider" in model else "#b3d1e6" for model in models] bars = [] for model, pass_rate, color in zip(models, pass_rates, colors): - alpha = 0.9 if "Aider" in model else 0.5 + alpha = 0.9 if "Aider" in model else 0.3 bar = ax.bar(model, pass_rate, color=color, alpha=alpha, zorder=3) bars.append(bar[0])