mirror of
https://github.com/ollama/ollama.git
synced 2026-02-19 15:57:07 -05:00
This change adds a new MLX based runner which includes: * Method-based MLX bindings * Subprocess-based MLX runner (x/mlxrunner) * KV cache with tree management * A basic sampler The GLM4-MoE-Lite model has been ported to use the new bindings. --------- Co-authored-by: Michael Yang <git@mxy.ng>
27 lines
561 B
Go
27 lines
561 B
Go
package runner
|
|
|
|
import (
|
|
"github.com/ollama/ollama/runner/llamarunner"
|
|
"github.com/ollama/ollama/runner/ollamarunner"
|
|
"github.com/ollama/ollama/x/imagegen"
|
|
"github.com/ollama/ollama/x/mlxrunner"
|
|
)
|
|
|
|
func Execute(args []string) error {
|
|
if args[0] == "runner" {
|
|
args = args[1:]
|
|
}
|
|
|
|
if len(args) > 0 {
|
|
switch args[0] {
|
|
case "--ollama-engine":
|
|
return ollamarunner.Execute(args[1:])
|
|
case "--imagegen-engine":
|
|
return imagegen.Execute(args[1:])
|
|
case "--mlx-engine":
|
|
return mlxrunner.Execute(args[1:])
|
|
}
|
|
}
|
|
return llamarunner.Execute(args)
|
|
}
|