mirror of
https://github.com/mudler/LocalAI.git
synced 2025-05-20 10:35:01 +00:00
feat(vllm): expose 'load_format' (#3943)
Signed-off-by: Ettore Di Giacinto <mudler@localai.io>
This commit is contained in:
parent
c75ecfa009
commit
ae1ec4e096
3 changed files with 4 additions and 0 deletions
|
@ -95,6 +95,8 @@ class BackendServicer(backend_pb2_grpc.BackendServicer):
|
|||
|
||||
if request.Quantization != "":
|
||||
engine_args.quantization = request.Quantization
|
||||
if request.LoadFormat != "":
|
||||
engine_args.load_format = request.LoadFormat
|
||||
if request.GPUMemoryUtilization != 0:
|
||||
engine_args.gpu_memory_utilization = request.GPUMemoryUtilization
|
||||
if request.TrustRemoteCode:
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue