@@ -33,7 +33,7 @@ type TokenUsage struct {
 	TimingTokenGeneration float64
 }
 
-func ModelInference(ctx context.Context, s string, messages []schema.Message, images, videos, audios []string, loader *model.ModelLoader, c config.BackendConfig, o *config.ApplicationConfig, tokenCallback func(string, TokenUsage) bool) (func() (LLMResponse, error), error) {
+func ModelInference(ctx context.Context, s string, messages []schema.Message, images, videos, audios []string, loader *model.ModelLoader, c *config.BackendConfig, o *config.ApplicationConfig, tokenCallback func(string, TokenUsage) bool) (func() (LLMResponse, error), error) {
 	modelFile := c.Model
 
 	// Check if the modelFile exists, if it doesn't try to load it from the gallery
@@ -48,7 +48,7 @@ func ModelInference(ctx context.Context, s string, messages []schema.Message, im
 		}
 	}
 
-	opts := ModelOptions(c, o)
+	opts := ModelOptions(*c, o)
 	inferenceModel, err := loader.Load(opts...)
 	if err != nil {
 		return nil, err
@@ -84,7 +84,7 @@ func ModelInference(ctx context.Context, s string, messages []schema.Message, im
 
 	// in GRPC, the backend is supposed to answer to 1 single token if stream is not supported
 	fn := func() (LLMResponse, error) {
-		opts := gRPCPredictOpts(c, loader.ModelPath)
+		opts := gRPCPredictOpts(*c, loader.ModelPath)
 		opts.Prompt = s
 		opts.Messages = protoMessages
 		opts.UseTokenizerTemplate = c.TemplateConfig.UseTokenizerTemplate
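
Note: after this change ModelInference takes the backend config by pointer, while helpers such as ModelOptions and gRPCPredictOpts still take it by value, which is why the call sites above dereference with *c. A minimal sketch of an adjusted caller, assuming placeholder names (cfg, appConfig, prompt, onToken) that are not identifiers from this repository:

	// Sketch only: cfg, appConfig, prompt, and onToken are hypothetical caller-side values.
	var cfg config.BackendConfig
	fnGen, err := ModelInference(ctx, prompt, messages, nil, nil, nil, loader, &cfg, appConfig, onToken)
	if err != nil {
		return nil, err
	}
	resp, err := fnGen() // runs the backend call and returns the final LLMResponse

Callers that previously passed the config by value only need to take its address; the pointer avoids copying the config struct on every inference call.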