mirror of
https://github.com/mudler/LocalAI.git
synced 2026-05-17 13:10:23 -04:00
* feat: Rework VRAM estimation and use known_usecases in gallery
  Signed-off-by: Richard Palethorpe <io@richiejp.com>
  Assisted-by: Claude:claude-opus-4-7[1m] [Claude Code]
* chore(gallery): regenerate gallery index and add known_usecases to model entries
  Signed-off-by: Richard Palethorpe <io@richiejp.com>
---------
Signed-off-by: Richard Palethorpe <io@richiejp.com>
25 lines
705 B
YAML
25 lines
705 B
YAML
# Gallery entry for the `deepseek-r1` model.
#
# `config_file` is a literal block scalar (`|`): everything indented beneath it
# is stored as ONE string that itself contains a YAML document. Comments are
# deliberately kept outside the scalar so the embedded text stays unchanged.
# NOTE(review): presumably the consumer parses this string as the model's
# configuration file — confirm against the gallery loader.
#
# The embedded document sets:
#   - backend `llama-cpp`, a 131072-token context size, `f16` and `mmap` on;
#   - `known_usecases` with the single entry `chat`;
#   - four stop tokens (the DeepSeek sentence/role markers);
#   - three templates (`chat`, `chat_message`, `completion`) written in
#     `{{ ... }}` template syntax. The `-}}` forms trim the whitespace that
#     follows the action, so the line breaks inside `chat_message` matter.
config_file: |
  backend: llama-cpp
  context_size: 131072
  f16: true
  known_usecases:
    - chat
  mmap: true
  stopwords:
    - <|begin▁of▁sentence|>
    - <|end▁of▁sentence|>
    - <|User|>
    - <|Assistant|>
  template:
    chat: |
      {{.Input -}}<|Assistant|>
    chat_message: |
      {{if eq .RoleName "system" -}}{{.Content }}
      {{ end -}}
      {{if eq .RoleName "user" -}}<|User|>{{.Content}}
      {{end -}}
      {{if eq .RoleName "assistant" -}}<|Assistant|>{{.Content}}<|end▁of▁sentence|>{{end}}
    completion: |
      {{.Input}}
# Top-level identifier of this gallery entry (a sibling of `config_file`,
# not part of the embedded configuration string).
name: deepseek-r1