mirror of
https://github.com/mudler/LocalAI.git
synced 2025-06-29 22:20:43 +00:00
Do not always try to load the tokenizer
Signed-off-by: Ettore Di Giacinto <mudler@localai.io>
This commit is contained in:
parent
0abb5f05be
commit
f536038f65
1 changed file with 5 additions and 1 deletion
|
@@ -95,6 +95,7 @@ class BackendServicer(backend_pb2_grpc.BackendServicer):
|
||||||
device_map="cpu"
|
device_map="cpu"
|
||||||
|
|
||||||
quantization = None
|
quantization = None
|
||||||
|
autoTokenizer = True
|
||||||
|
|
||||||
if self.CUDA:
|
if self.CUDA:
|
||||||
from transformers import BitsAndBytesConfig, AutoModelForCausalLM
|
from transformers import BitsAndBytesConfig, AutoModelForCausalLM
|
||||||
|
@@ -198,9 +199,11 @@ class BackendServicer(backend_pb2_grpc.BackendServicer):
|
||||||
device=device_map)
|
device=device_map)
|
||||||
self.OV = True
|
self.OV = True
|
||||||
elif request.Type == "MusicgenForConditionalGeneration":
|
elif request.Type == "MusicgenForConditionalGeneration":
|
||||||
|
autoTokenizer = False
|
||||||
self.processor = AutoProcessor.from_pretrained(model_name)
|
self.processor = AutoProcessor.from_pretrained(model_name)
|
||||||
self.model = MusicgenForConditionalGeneration.from_pretrained(model_name)
|
self.model = MusicgenForConditionalGeneration.from_pretrained(model_name)
|
||||||
elif request.Type == "OuteTTS":
|
elif request.Type == "OuteTTS":
|
||||||
|
autoTokenizer = False
|
||||||
options = request.Options
|
options = request.Options
|
||||||
MODELNAME = "OuteAI/OuteTTS-0.3-1B"
|
MODELNAME = "OuteAI/OuteTTS-0.3-1B"
|
||||||
TOKENIZER = "OuteAI/OuteTTS-0.3-1B"
|
TOKENIZER = "OuteAI/OuteTTS-0.3-1B"
|
||||||
|
@@ -239,6 +242,7 @@ class BackendServicer(backend_pb2_grpc.BackendServicer):
|
||||||
else:
|
else:
|
||||||
self.speaker = self.interface.load_default_speaker(name=SPEAKER)
|
self.speaker = self.interface.load_default_speaker(name=SPEAKER)
|
||||||
elif request.Type == "SentenceTransformer":
|
elif request.Type == "SentenceTransformer":
|
||||||
|
autoTokenizer = False
|
||||||
self.model = SentenceTransformer(model_name, trust_remote_code=request.TrustRemoteCode)
|
self.model = SentenceTransformer(model_name, trust_remote_code=request.TrustRemoteCode)
|
||||||
self.SentenceTransformer = True
|
self.SentenceTransformer = True
|
||||||
else:
|
else:
|
||||||
|
@@ -256,7 +260,7 @@ class BackendServicer(backend_pb2_grpc.BackendServicer):
|
||||||
else:
|
else:
|
||||||
self.max_tokens = 512
|
self.max_tokens = 512
|
||||||
|
|
||||||
if request.Type != "MusicgenForConditionalGeneration":
|
if autoTokenizer:
|
||||||
self.tokenizer = AutoTokenizer.from_pretrained(model_name, use_safetensors=True)
|
self.tokenizer = AutoTokenizer.from_pretrained(model_name, use_safetensors=True)
|
||||||
self.XPU = False
|
self.XPU = False
|
||||||
|
|
||||||
|
|
Loading…
Add table
Add a link
Reference in a new issue