fix(p2p): adapt to backend changes, general improvements (#5889)

The binary is now named "llama-cpp-rpc-server" for p2p workers.

We also decrease the default token rotation interval so that
peer discovery is much more responsive.

Signed-off-by: Ettore Di Giacinto <mudler@localai.io>
This commit is contained in:
Ettore Di Giacinto
2025-07-23 12:40:32 +02:00
committed by GitHub
parent c717b8d800
commit 5f7ece3e94
5 changed files with 63 additions and 11 deletions

View File

@@ -1,6 +1,7 @@
package worker
import (
"errors"
"fmt"
"os"
"path/filepath"
@@ -16,6 +17,10 @@ type LLamaCPP struct {
WorkerFlags `embed:""`
}
const (
// llamaCPPRPCBinaryName is the file name of the llama-cpp RPC server
// binary; findLLamaCPPBackend joins it onto the llama-cpp backend path
// to build the path of the process to run.
llamaCPPRPCBinaryName = "llama-cpp-rpc-server"
)
func findLLamaCPPBackend(backendSystemPath string) (string, error) {
backends, err := gallery.ListSystemBackends(backendSystemPath)
if err != nil {
@@ -33,12 +38,12 @@ func findLLamaCPPBackend(backendSystemPath string) (string, error) {
}
if backendPath == "" {
return "", fmt.Errorf("llama-cpp backend not found")
return "", errors.New("llama-cpp backend not found, install it first")
}
grpcProcess := filepath.Join(
backendPath,
"grpc-server",
llamaCPPRPCBinaryName,
)
return grpcProcess, nil

View File

@@ -31,7 +31,7 @@ func generateNewConnectionData(DHTInterval, OTPInterval int) *node.YAMLConnectio
maxMessSize := 20 << 20 // 20MB
keyLength := 43
if DHTInterval == 0 {
DHTInterval = 360
DHTInterval = 30
}
if OTPInterval == 0 {
OTPInterval = 9000
@@ -377,7 +377,7 @@ func newNodeOpts(token string) ([]node.Option, error) {
// TODO: move this up, expose more config options when creating a node
noDHT := os.Getenv("LOCALAI_P2P_DISABLE_DHT") == "true"
noLimits := os.Getenv("LOCALAI_P2P_ENABLE_LIMITS") == "true"
noLimits := os.Getenv("LOCALAI_P2P_ENABLE_LIMITS") != "true"
var listenMaddrs []string
var bootstrapPeers []string