From fade34394cf048fb46fa455d73994d2ae1016f8f Mon Sep 17 00:00:00 2001 From: TheDropZone Date: Mon, 17 Feb 2025 16:25:24 -0500 Subject: [PATCH] using " marks in the config.yaml file Signed-off-by: TheDropZone --- gallery/vllm.yaml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/gallery/vllm.yaml b/gallery/vllm.yaml index b97f48d5..f0b797cc 100644 --- a/gallery/vllm.yaml +++ b/gallery/vllm.yaml @@ -16,8 +16,8 @@ config_file: | use_tokenizer_template: true # Uncomment to specify a quantization method (optional) # quantization: "awq" - # Uncomment to set dtype, choices are: 'auto', 'half', 'float16', 'bfloat16', 'float', 'float32'. awq on vLLM does not support bfloat16 - # dtype: 'float16' + # Uncomment to set dtype, choices are: "auto", "half", "float16", "bfloat16", "float", "float32". awq on vLLM does not support bfloat16 + # dtype: "float16" # Uncomment to limit the GPU memory utilization (vLLM default is 0.9 for 90%) # gpu_memory_utilization: 0.5 # Uncomment to trust remote code from huggingface