feat(vllm): Allow to set quantization (#1094)

This is particularly useful to set AWQ. **Description** Follow-up to #1015 **Notes for Reviewers** **[Signed commits](../CONTRIBUTING.md#signing-off-on-commits-developer-certificate-of-origin)** - [ ] Yes, I signed my commits.  --------- Signed-off-by: Ettore Di Giacinto <mudler@localai.io>
2025-05-20 10:35:01 +00:00 · 2023-09-22 15:52:38 +02:00 · 2023-09-22 15:52:38 +02:00 · a28ab18987
commit a28ab18987
parent 048b81373d
13 changed files with 357 additions and 332 deletions
--- a/api/backend/options.go
+++ b/api/backend/options.go
@@ -44,6 +44,7 @@ func gRPCModelOpts(c config.Config) *pb.ModelOptions {
 		NoMulMatQ:     c.NoMulMatQ,
 		DraftModel:    c.DraftModel,
 		AudioPath:     c.VallE.AudioPath,
+		Quantization:  c.Quantization,
 		LoraAdapter:   c.LoraAdapter,
 		LoraBase:      c.LoraBase,
 		NGQA:          c.NGQA,