
Commit 55509d3

Load wrapper clients
Testing with:

```yaml
name: gpt-4o
pipeline:
  tts: voice-it-riccardo_fasol-x-low
  transcription: whisper-base-q5_1
  llm: llama-3.2-1b-instruct:q4_k_m
```

Signed-off-by: Ettore Di Giacinto <[email protected]>
1 parent c824422 commit 55509d3


2 files changed: +36 −7 lines


core/config/backend_config.go

Lines changed: 1 addition & 1 deletion
```diff
@@ -79,7 +79,7 @@ type BackendConfig struct {
 type Pipeline struct {
 	TTS           string `yaml:"tts"`
 	LLM           string `yaml:"llm"`
-	Transcription string `yaml:"sst"`
+	Transcription string `yaml:"transcription"`
 }
 
 type File struct {
```
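For context, here is a minimal standalone sketch (not part of the commit) of what the renamed key changes in practice: the pipeline's transcription model is now selected with `transcription` instead of the misspelled `sst`. The trimmed-down `Config` type and the use of `gopkg.in/yaml.v3` here are assumptions for illustration only.

```go
package main

import (
	"fmt"

	"gopkg.in/yaml.v3"
)

// Pipeline mirrors the struct from the diff above.
type Pipeline struct {
	TTS           string `yaml:"tts"`
	LLM           string `yaml:"llm"`
	Transcription string `yaml:"transcription"` // was `yaml:"sst"` before this commit
}

// Config is a hypothetical stand-in for BackendConfig, trimmed to the
// fields needed to parse the YAML from the commit message.
type Config struct {
	Name     string   `yaml:"name"`
	Pipeline Pipeline `yaml:"pipeline"`
}

func main() {
	data := []byte(`
name: gpt-4o
pipeline:
  tts: voice-it-riccardo_fasol-x-low
  transcription: whisper-base-q5_1
  llm: llama-3.2-1b-instruct:q4_k_m
`)
	var cfg Config
	if err := yaml.Unmarshal(data, &cfg); err != nil {
		panic(err)
	}
	// Before the fix, Transcription stayed empty unless the config used
	// the misspelled `sst` key; now the `transcription` key populates it.
	fmt.Printf("%+v\n", cfg.Pipeline)
}
```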

core/http/endpoints/openai/realtime.go

Lines changed: 35 additions & 6 deletions
```diff
@@ -10,7 +10,9 @@ import (
 	"github.com/gofiber/websocket/v2"
 	"github.com/mudler/LocalAI/core/backend"
 	"github.com/mudler/LocalAI/core/config"
+	grpc "github.com/mudler/LocalAI/pkg/grpc"
 	model "github.com/mudler/LocalAI/pkg/model"
+
 	"github.com/rs/zerolog/log"
 )
 
@@ -111,13 +113,17 @@ type Model interface {
 }
 
 type wrappedModel struct {
-	TTS *config.BackendConfig
-	SST *config.BackendConfig
-	LLM *config.BackendConfig
+	TTSConfig           *config.BackendConfig
+	TranscriptionConfig *config.BackendConfig
+	LLMConfig           *config.BackendConfig
+	TTSClient           grpc.Backend
+	TranscriptionClient grpc.Backend
+	LLMClient           grpc.Backend
 }
 
 // returns and loads either a wrapped model or a model that support audio-to-audio
 func newModel(cl *config.BackendConfigLoader, ml *model.ModelLoader, appConfig *config.ApplicationConfig, modelName string) (Model, error) {
+
 	cfg, err := cl.LoadBackendConfigFileByName(modelName, ml.ModelPath)
 	if err != nil {
 		return nil, fmt.Errorf("failed to load backend config: %w", err)
@@ -134,6 +140,8 @@ func newModel(cl *config.BackendConfigLoader, ml *model.ModelLoader, appConfig *
 		return ml.BackendLoader(opts...)
 	}
 
+	log.Debug().Msg("Loading a wrapped model")
+
 	// Otherwise we want to return a wrapped model, which is a "virtual" model that re-uses other models to perform operations
 	cfgLLM, err := cl.LoadBackendConfigFileByName(cfg.Pipeline.LLM, ml.ModelPath)
 	if err != nil {
@@ -165,10 +173,31 @@ func newModel(cl *config.BackendConfigLoader, ml *model.ModelLoader, appConfig *
 		return nil, fmt.Errorf("failed to validate config: %w", err)
 	}
 
+	opts := backend.ModelOptions(*cfgTTS, appConfig)
+	ttsClient, err := ml.BackendLoader(opts...)
+	if err != nil {
+		return nil, fmt.Errorf("failed to load tts model: %w", err)
+	}
+
+	opts = backend.ModelOptions(*cfgSST, appConfig)
+	transcriptionClient, err := ml.BackendLoader(opts...)
+	if err != nil {
+		return nil, fmt.Errorf("failed to load SST model: %w", err)
+	}
+
+	opts = backend.ModelOptions(*cfgLLM, appConfig)
+	llmClient, err := ml.BackendLoader(opts...)
+	if err != nil {
+		return nil, fmt.Errorf("failed to load LLM model: %w", err)
+	}
+
 	return &wrappedModel{
-		TTS: cfgTTS,
-		SST: cfgSST,
-		LLM: cfgLLM,
+		TTSConfig:           cfgTTS,
+		TranscriptionConfig: cfgSST,
+		LLMConfig:           cfgLLM,
+		TTSClient:           ttsClient,
+		TranscriptionClient: transcriptionClient,
+		LLMClient:           llmClient,
 	}, nil
 }
```
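The three load blocks added above are identical in shape. As a side note, a hypothetical helper (not in this commit) could fold them into one place; it relies only on the two calls the diff itself makes, `backend.ModelOptions` and `ml.BackendLoader`, so everything below is a sketch drawn from the diff rather than an API guarantee.

```go
// loadClient is a hypothetical helper, sketched from the calls visible in
// the diff above; it is not part of this commit. It assumes the same
// imports realtime.go already uses (backend, config, grpc, model, fmt).
func loadClient(ml *model.ModelLoader, appConfig *config.ApplicationConfig,
	cfg *config.BackendConfig, kind string) (grpc.Backend, error) {
	opts := backend.ModelOptions(*cfg, appConfig)
	client, err := ml.BackendLoader(opts...)
	if err != nil {
		return nil, fmt.Errorf("failed to load %s model: %w", kind, err)
	}
	return client, nil
}
```

With such a helper, each load in `newModel` would collapse to a one-liner such as `ttsClient, err := loadClient(ml, appConfig, cfgTTS, "tts")`.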
