Files
LocalAI/core/services/modeladmin/config.go
Richard Palethorpe 3fa7b2955c feat(pii): NER tier engine — privacy-filter.cpp backend + NER-centric PII filter (#10360)
Squashed feat/pii-ner-tier-engine rebased onto master (was 45 commits; see
backup/pii-ner-tier-engine-prerebase). Net change:

- privacy-filter.cpp: standalone GGML engine for the openai-privacy-filter
  PII/NER token classifier, wired as a LocalAI gRPC backend (CPU/CUDA/Vulkan).
  TokenClassify moves off the patched llama.cpp path onto this backend.
- PII filter reworked to be NER-centric (encoder/NER detection tier scanning
  whole conversations as one document), with a recreated bounded restricted-
  regex secret-matching pattern detector tier alongside it (per-model
  pii_detection.builtins / .patterns + core/services/routing/piipattern).
- Detection labelled by source (ner vs pattern); backend trace / confidence /
  debug observability; analyze/redact exposed as a synchronous API.
- Instance-wide default detector policy + per-usecase default-on; request
  filtering extended to completions, embeddings, edits & Ollama.
- React UI: NER-centric PII editor, detector-models table, pattern/builtins
  editor, middleware default-policy UI.
- Gallery: privacy-filter-multilingual token-classify model + NER install
  filter; token_classify known_usecase; batch sized to context for NER models.
  privacy-filter backend registered in the backend gallery (cpu/vulkan/cuda-13
  meta + image entries with a capabilities map) matching its CI matrix jobs,
  and an /import-model auto-detect importer (PrivacyFilterImporter, narrow
  privacy-filter GGUF detection) replacing the prior pref-only registration.

Reconciled against master's independent evolution:

- Dropped master's PIIPatternOverrides feature (global-pattern runtime
  overrides + /api/pii/patterns API + runtime_settings.json persistence). The
  per-model NER + pattern-detector design supersedes it; it was built on the
  global redactor pattern set this branch replaced.
- Reverted the llama.cpp Score carry-patch (0006-server-task-type-score):
  removed the patch and restored master's grpc-server.cpp Score RPC (direct
  llama_decode, slot-loop bypass) and LLAMA_VERSION pin, plus master's
  model_config validation forbidding score + chat/completion/embeddings on
  llama-cpp. token_classify is unaffected (it runs on the privacy-filter
  backend, not llama-cpp).

Assisted-by: Claude:claude-opus-4-8 [Claude Code]

Signed-off-by: Richard Palethorpe <io@richiejp.com>
2026-06-18 11:45:22 +01:00

285 lines
9.8 KiB
Go

package modeladmin
import (
"context"
"errors"
"fmt"
"os"
"path/filepath"
"reflect"
"strings"
"gopkg.in/yaml.v3"
"github.com/mudler/LocalAI/core/config"
"github.com/mudler/LocalAI/core/config/meta"
"github.com/mudler/LocalAI/core/gallery"
"github.com/mudler/LocalAI/pkg/model"
"github.com/mudler/LocalAI/pkg/utils"
)
// ConfigService groups operations that read or mutate an installed model's
// configuration on disk. It keeps the side-effect surface (loader reload,
// model shutdown) explicit so callers know what gets touched.
type ConfigService struct {
Loader *config.ModelConfigLoader
AppConfig *config.ApplicationConfig
}
// NewConfigService returns a ConfigService bound to the supplied loader and
// app config. The loader and the system state in AppConfig are mandatory; the
// model loader is required only by EditYAML and ToggleState (for Shutdown).
func NewConfigService(loader *config.ModelConfigLoader, appConfig *config.ApplicationConfig) *ConfigService {
return &ConfigService{Loader: loader, AppConfig: appConfig}
}
// ConfigView is the on-disk YAML plus the parsed JSON view, returned by GetConfig.
// The YAML is read from disk (not serialised from the in-memory loader) so
// callers see exactly what the user wrote — no SetDefaults() noise.
type ConfigView struct {
Name string
YAML string
JSON map[string]any
}
// EditResult is what EditYAML returns to its caller.
type EditResult struct {
Filename string
Renamed bool
OldName string
NewName string
Config config.ModelConfig
}
// modelsPath is shorthand for the configured models directory.
func (s *ConfigService) modelsPath() string {
return s.AppConfig.SystemState.Model.ModelsPath
}
// GetConfig reads the YAML for an installed model from disk and returns it
// alongside the parsed JSON view.
func (s *ConfigService) GetConfig(_ context.Context, name string) (*ConfigView, error) {
if name == "" {
return nil, ErrNameRequired
}
cfg, exists := s.Loader.GetModelConfig(name)
if !exists {
return nil, ErrNotFound
}
configPath := cfg.GetModelConfigFile()
if configPath == "" {
return nil, ErrConfigFileMissing
}
if err := utils.VerifyPath(configPath, s.modelsPath()); err != nil {
return nil, fmt.Errorf("%w: %v", ErrPathNotTrusted, err)
}
data, err := os.ReadFile(configPath)
if err != nil {
return nil, fmt.Errorf("read config file: %w", err)
}
var jsonView map[string]any
_ = yaml.Unmarshal(data, &jsonView)
return &ConfigView{Name: name, YAML: string(data), JSON: jsonView}, nil
}
// PatchConfig applies a JSON deep-merge to an installed model's YAML and
// reloads. Returns the merged config that's now in the loader.
//
// Mirrors PatchConfigEndpoint: read raw YAML from disk (not the in-memory
// config — which has SetDefaults applied and would persist runtime defaults
// like top_p/temperature/mirostat), deep-merge the patch, validate, write,
// reload, preload (preload errors are non-fatal — log only).
func (s *ConfigService) PatchConfig(_ context.Context, name string, patch map[string]any) (*config.ModelConfig, error) {
if name == "" {
return nil, ErrNameRequired
}
if len(patch) == 0 {
return nil, ErrEmptyBody
}
cfg, exists := s.Loader.GetModelConfig(name)
if !exists {
return nil, ErrNotFound
}
configPath := cfg.GetModelConfigFile()
if err := utils.VerifyPath(configPath, s.modelsPath()); err != nil {
return nil, fmt.Errorf("%w: %v", ErrPathNotTrusted, err)
}
diskYAML, err := os.ReadFile(configPath)
if err != nil {
return nil, fmt.Errorf("read config file: %w", err)
}
var existingMap map[string]any
if err := yaml.Unmarshal(diskYAML, &existingMap); err != nil {
return nil, fmt.Errorf("parse existing config: %w", err)
}
if existingMap == nil {
existingMap = map[string]any{}
}
patchMerge(existingMap, patch, mapLeafFieldPaths(), "")
yamlData, err := yaml.Marshal(existingMap)
if err != nil {
return nil, fmt.Errorf("marshal merged YAML: %w", err)
}
var updated config.ModelConfig
if err := yaml.Unmarshal(yamlData, &updated); err != nil {
return nil, fmt.Errorf("%w: %v", ErrInvalidConfig, err)
}
if valid, vErr := updated.Validate(); !valid {
if vErr != nil {
return nil, fmt.Errorf("%w: %v", ErrInvalidConfig, vErr)
}
return nil, ErrInvalidConfig
}
if err := writeFileAtomic(configPath, yamlData, 0644); err != nil {
return nil, fmt.Errorf("write config file: %w", err)
}
if err := s.Loader.LoadModelConfigsFromPath(s.modelsPath(), s.AppConfig.ToConfigLoaderOptions()...); err != nil {
return nil, fmt.Errorf("reload configs: %w", err)
}
// Preload is best-effort — a failure here doesn't undo the patch.
_ = s.Loader.Preload(s.modelsPath())
return &updated, nil
}
// mapLeafFieldPaths returns the set of dotted config paths whose schema type is
// a map that the editor edits as one complete value (e.g.
// pii_detection.entity_actions, roles, engine_args). A PATCH must REPLACE these
// wholesale rather than union them: the deep-merge only adds and overrides
// keys, so a map entry the admin deleted in the editor would otherwise silently
// survive. Derived from the config schema so it stays correct as map fields are
// added. (UIType comes from reflection, independent of any registry override.)
func mapLeafFieldPaths() map[string]struct{} {
md := meta.BuildConfigMetadata(reflect.TypeFor[config.ModelConfig]())
out := make(map[string]struct{})
for _, f := range md.Fields {
if f.UIType == "map" {
out[f.Path] = struct{}{}
}
}
return out
}
// patchMerge deep-merges src into dst with the same shape as the previous
// mergo.WithOverride behaviour — scalars and slices replace; nested
// struct-maps (e.g. pii_detection, parameters) recurse so unknown sibling keys
// the editor doesn't model survive — EXCEPT that any path in mapLeaves is
// replaced wholesale, and removed when the patch sets it empty, so deletions
// inside a map field persist to disk.
func patchMerge(dst, src map[string]any, mapLeaves map[string]struct{}, prefix string) {
for k, sv := range src {
path := k
if prefix != "" {
path = prefix + "." + k
}
if _, isLeaf := mapLeaves[path]; isLeaf {
if m, ok := sv.(map[string]any); ok && len(m) == 0 {
delete(dst, k) // emptied map field -> drop it from the YAML
} else {
dst[k] = sv
}
continue
}
// Recurse into struct-like nesting so dst-only sibling keys survive.
if sm, ok := sv.(map[string]any); ok {
if dm, ok2 := dst[k].(map[string]any); ok2 {
patchMerge(dm, sm, mapLeaves, path)
continue
}
}
dst[k] = sv
}
}
// EditYAML replaces the YAML for an installed model, with optional rename
// support. ml may be nil; when set, EditYAML calls ml.ShutdownModel(oldName)
// after a successful write so the next inference picks up the new config.
func (s *ConfigService) EditYAML(_ context.Context, name string, body []byte, ml *model.ModelLoader) (*EditResult, error) {
if name == "" {
return nil, ErrNameRequired
}
if len(body) == 0 {
return nil, ErrEmptyBody
}
existing, exists := s.Loader.GetModelConfig(name)
if !exists {
return nil, ErrNotFound
}
var req config.ModelConfig
if err := yaml.Unmarshal(body, &req); err != nil {
return nil, fmt.Errorf("%w: %v", ErrInvalidConfig, err)
}
if req.Name == "" {
return nil, fmt.Errorf("%w: name field is required", ErrInvalidConfig)
}
if valid, _ := req.Validate(); !valid {
return nil, ErrInvalidConfig
}
configPath := existing.GetModelConfigFile()
modelsPath := s.modelsPath()
if err := utils.VerifyPath(configPath, modelsPath); err != nil {
return nil, fmt.Errorf("%w: %v", ErrPathNotTrusted, err)
}
renamed := req.Name != name
if renamed {
if strings.ContainsRune(req.Name, os.PathSeparator) || strings.Contains(req.Name, "/") || strings.Contains(req.Name, "\\") {
return nil, ErrPathSeparator
}
if _, exists := s.Loader.GetModelConfig(req.Name); exists {
return nil, fmt.Errorf("%w: %q", ErrConflict, req.Name)
}
newConfigPath := filepath.Join(modelsPath, req.Name+".yaml")
if err := utils.VerifyPath(newConfigPath, modelsPath); err != nil {
return nil, fmt.Errorf("%w: %v", ErrPathNotTrusted, err)
}
if _, err := os.Stat(newConfigPath); err == nil {
return nil, fmt.Errorf("%w: a config file for %q already exists on disk", ErrConflict, req.Name)
} else if !errors.Is(err, os.ErrNotExist) {
return nil, fmt.Errorf("stat new config: %w", err)
}
if err := writeFileAtomic(newConfigPath, body, 0644); err != nil {
return nil, fmt.Errorf("write new config: %w", err)
}
if configPath != newConfigPath {
// Best-effort: a stale old file is cosmetic, not load-bearing.
_ = os.Remove(configPath)
}
// Move the gallery metadata file so the delete flow can still find it.
oldGalleryPath := filepath.Join(modelsPath, gallery.GalleryFileName(name))
newGalleryPath := filepath.Join(modelsPath, gallery.GalleryFileName(req.Name))
if _, err := os.Stat(oldGalleryPath); err == nil {
_ = os.Rename(oldGalleryPath, newGalleryPath)
}
// Drop the stale in-memory entry before reload so we don't surface
// both names between scan steps.
s.Loader.RemoveModelConfig(name)
configPath = newConfigPath
} else {
if err := writeFileAtomic(configPath, body, 0644); err != nil {
return nil, fmt.Errorf("write config: %w", err)
}
}
if err := s.Loader.LoadModelConfigsFromPath(modelsPath, s.AppConfig.ToConfigLoaderOptions()...); err != nil {
return nil, fmt.Errorf("reload configs: %w", err)
}
// Best-effort shutdown: the config is already written; if shutdown fails
// the caller can manually reload. The shutdown uses the OLD name because
// that's what the running instance was started with.
if ml != nil {
_ = ml.ShutdownModel(name)
}
if err := s.Loader.Preload(modelsPath); err != nil {
return nil, fmt.Errorf("preload after edit: %w", err)
}
return &EditResult{
Filename: configPath,
Renamed: renamed,
OldName: name,
NewName: req.Name,
Config: req,
}, nil
}