diff --git a/aider/website/_includes/quant-chart.js b/aider/website/_includes/quant-chart.js
new file mode 100644
index 000000000..9ae95160c
--- /dev/null
+++ b/aider/website/_includes/quant-chart.js
@@ -0,0 +1,49 @@
+// Renders the quantization benchmark bar chart into the #quantChart canvas.
+// This file is a Jekyll include: the Liquid tags below are expanded at site
+// build time, emitting one allData.push(...) per row of site.data.quant.
+document.addEventListener('DOMContentLoaded', function () {
+  var canvas = document.getElementById('quantChart');
+  if (!canvas) {
+    // The include was rendered on a page without the chart canvas; nothing to draw.
+    return;
+  }
+  var ctx = canvas.getContext('2d');
+  var chartData = {
+    labels: [],
+    datasets: [{
+      label: 'Percent completed correctly',
+      data: [],
+      backgroundColor: 'rgba(54, 162, 235, 0.2)',
+      borderColor: 'rgba(54, 162, 235, 1)',
+      borderWidth: 1
+    }]
+  };
+
+  var allData = [];
+  // jsonify emits quoted, escaped literals, so a model name containing a quote
+  // or backslash (or a missing pass_rate_2) cannot break the generated script.
+  {% for row in site.data.quant %}
+  allData.push({
+    model: {{ row.model | jsonify }},
+    pass_rate_2: {{ row.pass_rate_2 | jsonify }}
+  });
+  {% endfor %}
+
+  // Split the rows into the label and value arrays held by chartData.
+  allData.forEach(function(row) {
+    chartData.labels.push(row.model);
+    chartData.datasets[0].data.push(row.pass_rate_2);
+  });
+
+  new Chart(ctx, {
+    type: 'bar',
+    data: chartData,
+    options: {
+      scales: {
+        y: {
+          beginAtZero: true
+        }
+      }
+    }
+  });
+});
diff --git a/aider/website/_posts/2024-11-21-quantization.md b/aider/website/_posts/2024-11-21-quantization.md
index 0a2382d82..a3fd656fb 100644
--- a/aider/website/_posts/2024-11-21-quantization.md
+++ b/aider/website/_posts/2024-11-21-quantization.md
@@ -21,7 +21,8 @@ and local model servers like ollama.
 The graph below compares 4 different versions of the Qwen 2.5 32B model,
 served both locally and from cloud providers:
 
-- Qwen2.5-Coder-32B-Instruct
-- ollama/qwen2.5:32b
-- ollama/qwen2.5:32b-instruct-q8_0
-- openrouter/qwen/qwen-2.5-coder-32b-instruct
+
+
+