mirror of
https://github.com/mudler/LocalAI.git
synced 2026-04-04 23:14:41 -04:00
* feat(audio): set audio content type Signed-off-by: Ettore Di Giacinto <mudler@localai.io> * chore: add tests Signed-off-by: Ettore Di Giacinto <mudler@localai.io> --------- Signed-off-by: Ettore Di Giacinto <mudler@localai.io>
63 lines
2.0 KiB
Go
63 lines
2.0 KiB
Go
package elevenlabs
|
|
|
|
import (
|
|
"path/filepath"
|
|
|
|
"github.com/labstack/echo/v4"
|
|
"github.com/mudler/LocalAI/core/backend"
|
|
"github.com/mudler/LocalAI/core/config"
|
|
"github.com/mudler/LocalAI/core/http/middleware"
|
|
"github.com/mudler/LocalAI/core/schema"
|
|
"github.com/mudler/LocalAI/pkg/audio"
|
|
"github.com/mudler/LocalAI/pkg/model"
|
|
"github.com/mudler/xlog"
|
|
)
|
|
|
|
// SoundGenerationEndpoint is the ElevenLabs SoundGeneration endpoint https://elevenlabs.io/docs/api-reference/sound-generation
|
|
// @Summary Generates audio from the input text.
|
|
// @Param request body schema.ElevenLabsSoundGenerationRequest true "query params"
|
|
// @Success 200 {string} binary "Response"
|
|
// @Router /v1/sound-generation [post]
|
|
func SoundGenerationEndpoint(cl *config.ModelConfigLoader, ml *model.ModelLoader, appConfig *config.ApplicationConfig) echo.HandlerFunc {
|
|
return func(c echo.Context) error {
|
|
|
|
input, ok := c.Get(middleware.CONTEXT_LOCALS_KEY_LOCALAI_REQUEST).(*schema.ElevenLabsSoundGenerationRequest)
|
|
if !ok || input.ModelID == "" {
|
|
return echo.ErrBadRequest
|
|
}
|
|
|
|
cfg, ok := c.Get(middleware.CONTEXT_LOCALS_KEY_MODEL_CONFIG).(*config.ModelConfig)
|
|
if !ok || cfg == nil {
|
|
return echo.ErrBadRequest
|
|
}
|
|
|
|
xlog.Debug("Sound Generation Request about to be sent to backend", "modelFile", "modelFile", "backend", cfg.Backend)
|
|
|
|
language := input.Language
|
|
if language == "" {
|
|
language = input.VocalLanguage
|
|
}
|
|
var bpm *int32
|
|
if input.BPM != nil {
|
|
b := int32(*input.BPM)
|
|
bpm = &b
|
|
}
|
|
filePath, _, err := backend.SoundGeneration(
|
|
input.Text, input.Duration, input.Temperature, input.DoSample,
|
|
nil, nil,
|
|
input.Think, input.Caption, input.Lyrics, bpm, input.Keyscale,
|
|
language, input.Timesignature,
|
|
input.Instrumental,
|
|
ml, appConfig, *cfg)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
|
|
filePath, contentType := audio.NormalizeAudioFile(filePath)
|
|
if contentType != "" {
|
|
c.Response().Header().Set("Content-Type", contentType)
|
|
}
|
|
return c.Attachment(filePath, filepath.Base(filePath))
|
|
}
|
|
}
|