mirror of
https://github.com/mudler/LocalAI.git
synced 2025-05-28 06:25:00 +00:00
feat: update llama, enable NUMA (#684)
This commit is contained in:
parent
e130b208ab
commit
3593cb0c87
3 changed files with 6 additions and 1 deletion
|
@ -23,6 +23,7 @@ type Config struct {
|
|||
TrimSpace []string `yaml:"trimspace"`
|
||||
ContextSize int `yaml:"context_size"`
|
||||
F16 bool `yaml:"f16"`
|
||||
NUMA bool `yaml:"numa"`
|
||||
Threads int `yaml:"threads"`
|
||||
Debug bool `yaml:"debug"`
|
||||
Roles map[string]string `yaml:"roles"`
|
||||
|
|
|
@ -48,6 +48,10 @@ func defaultLLamaOpts(c Config) []llama.ModelOption {
|
|||
llamaOpts = append(llamaOpts, llama.SetNBatch(512))
|
||||
}
|
||||
|
||||
if c.NUMA {
|
||||
llamaOpts = append(llamaOpts, llama.EnableNUMA)
|
||||
}
|
||||
|
||||
if c.LowVRAM {
|
||||
llamaOpts = append(llamaOpts, llama.EnabelLowVRAM)
|
||||
}
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue