From 73cb2f8fa520ec8fb4e03d6ef51261372ca77a70 Mon Sep 17 00:00:00 2001
From: Ettore Di Giacinto
Date: Thu, 15 May 2025 23:17:08 +0200
Subject: [PATCH] Reset auto detected template

Signed-off-by: Ettore Di Giacinto
---
 backend/cpp/llama/grpc-server.cpp | 4 ++++
 1 file changed, 4 insertions(+)

diff --git a/backend/cpp/llama/grpc-server.cpp b/backend/cpp/llama/grpc-server.cpp
index e688a7fa..d4845903 100644
--- a/backend/cpp/llama/grpc-server.cpp
+++ b/backend/cpp/llama/grpc-server.cpp
@@ -3587,6 +3587,10 @@ static void start_llama_server(server_context& ctx_server) {
             common_chat_templates_source(ctx_server.chat_templates.get()),
             common_chat_format_example(ctx_server.chat_templates.get(), ctx_server.params_base.use_jinja).c_str());
 
+    // Reset the chat templates
+    // TODO: We should make this configurable by respecting the option that is already present in LocalAI for vLLM
+    ctx_server.chat_templates.reset();
+
     ctx_server.queue_tasks.on_new_task([&ctx_server](server_task && task) {
         ctx_server.process_single_task(std::move(task));
     });
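
Note (not part of the patch): the TODO above says the reset should eventually respect the
template option LocalAI already exposes for the vLLM backend. A minimal sketch of one way
the reset could be gated, assuming a hypothetical environment variable; the variable name
and the plumbing are illustrative only and are not the existing LocalAI option:

    // Requires <cstdlib> and <string>.
    // LLAMACPP_USE_AUTODETECTED_TEMPLATE is a hypothetical knob, named here
    // only for illustration; the real option would come from LocalAI's config.
    const char * keep_tmpl = std::getenv("LLAMACPP_USE_AUTODETECTED_TEMPLATE");
    if (keep_tmpl == nullptr || std::string(keep_tmpl) != "true") {
        // Default behaviour of this patch: drop the auto-detected chat template.
        ctx_server.chat_templates.reset();
    }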