LocalAI/backend/go/omnivoice-cpp/e2e_test.go

package main

import (
	"os"
	"strings"

	"github.com/ebitengine/purego"
	pb "github.com/mudler/LocalAI/pkg/grpc/proto"
	. "github.com/onsi/ginkgo/v2"
	. "github.com/onsi/gomega"
)

func ttsReq(text, voice string, lang *string, dst string) *pb.TTSRequest {
	return &pb.TTSRequest{Text: text, Voice: voice, Language: lang, Dst: dst}
}

var _ = Describe("OmniVoice e2e", Label("e2e"), func() {
	var loaded bool

	BeforeEach(func() {
		modelPath := os.Getenv("OMNIVOICE_MODEL")
		codecPath := os.Getenv("OMNIVOICE_CODEC")
		if modelPath == "" || codecPath == "" {
			Skip("OMNIVOICE_MODEL / OMNIVOICE_CODEC not set; skipping e2e")
		}
		if !loaded {
			lib := os.Getenv("OMNIVOICE_LIBRARY")
			if lib == "" {
				lib = "./libgomnivoicecpp-fallback.so"
			}
			h, err := purego.Dlopen(lib, purego.RTLD_NOW|purego.RTLD_GLOBAL)
			Expect(err).ToNot(HaveOccurred())
			purego.RegisterLibFunc(&CppLoad, h, "omni_load")
			purego.RegisterLibFunc(&CppTTS, h, "omni_tts")
			purego.RegisterLibFunc(&CppTTSStream, h, "omni_tts_stream")
			purego.RegisterLibFunc(&CppPCMFree, h, "omni_pcm_free")
			purego.RegisterLibFunc(&CppUnload, h, "omni_unload")
			Expect(CppLoad(modelPath, codecPath, 0, 0)).To(Equal(0))
			loaded = true
		}
	})

	It("synthesizes a WAV file via TTS", func() {
		b := &OmnivoiceCpp{opts: loadOptions{seed: 42, denoise: true}}
		dst := GinkgoT().TempDir() + "/out.wav"
		lang := "en"
		err := b.TTS(ttsReq("Hello world.", "", &lang, dst))
		Expect(err).ToNot(HaveOccurred())
		fi, err := os.Stat(dst)
		Expect(err).ToNot(HaveOccurred())
		Expect(fi.Size()).To(BeNumerically(">", int64(44)))
	})

	It("streams audio chunks via TTSStream", func() {
		b := &OmnivoiceCpp{opts: loadOptions{seed: 42, denoise: true}}
		results := make(chan []byte, 1024)
		lang := "en"
		done := make(chan error, 1)
		go func() { done <- b.TTSStream(ttsReq("Hello there, streaming test.", "", &lang, ""), results) }()

		var chunks int
		var first []byte
		for c := range results {
			if chunks == 0 {
				first = c
			}
			chunks++
		}
		Expect(<-done).ToNot(HaveOccurred())
		Expect(chunks).To(BeNumerically(">=", 2))
		Expect(string(first[0:4])).To(Equal("RIFF"))
		Expect(strings.HasPrefix(string(first[8:12]), "WAVE")).To(BeTrue())
	})
})