2023-07-14 23:19:43 +00:00
|
|
|
package backend
|
|
|
|
|
|
|
|
import (
|
|
|
|
"fmt"
|
|
|
|
|
|
|
|
config "github.com/go-skynet/LocalAI/api/config"
|
|
|
|
"github.com/go-skynet/LocalAI/api/options"
|
|
|
|
"github.com/go-skynet/LocalAI/pkg/grpc"
|
|
|
|
model "github.com/go-skynet/LocalAI/pkg/model"
|
|
|
|
)
|
|
|
|
|
|
|
|
func ModelEmbedding(s string, tokens []int, loader *model.ModelLoader, c config.Config, o *options.Option) (func() ([]float32, error), error) {
|
|
|
|
if !c.Embeddings {
|
|
|
|
return nil, fmt.Errorf("endpoint disabled for this model by API configuration")
|
|
|
|
}
|
|
|
|
|
|
|
|
modelFile := c.Model
|
|
|
|
|
|
|
|
grpcOpts := gRPCModelOpts(c)
|
|
|
|
|
|
|
|
var inferenceModel interface{}
|
|
|
|
var err error
|
|
|
|
|
|
|
|
opts := []model.Option{
|
2023-08-09 06:38:51 +00:00
|
|
|
model.WithLoadGRPCLoadModelOpts(grpcOpts),
|
2023-07-14 23:19:43 +00:00
|
|
|
model.WithThreads(uint32(c.Threads)),
|
|
|
|
model.WithAssetDir(o.AssetsDestination),
|
2023-08-07 20:39:10 +00:00
|
|
|
model.WithModel(modelFile),
|
2023-07-14 23:19:43 +00:00
|
|
|
model.WithContext(o.Context),
|
2023-07-14 23:19:43 +00:00
|
|
|
}
|
|
|
|
|
2023-08-15 23:11:32 +00:00
|
|
|
if c.GRPC.Attempts != 0 {
|
|
|
|
opts = append(opts, model.WithGRPCAttempts(c.GRPC.Attempts))
|
|
|
|
}
|
|
|
|
|
|
|
|
if c.GRPC.AttemptsSleepTime != 0 {
|
|
|
|
opts = append(opts, model.WithGRPCAttemptsDelay(c.GRPC.AttemptsSleepTime))
|
|
|
|
}
|
|
|
|
|
2023-07-20 20:10:12 +00:00
|
|
|
for k, v := range o.ExternalGRPCBackends {
|
|
|
|
opts = append(opts, model.WithExternalBackend(k, v))
|
|
|
|
}
|
|
|
|
|
2023-07-14 23:19:43 +00:00
|
|
|
if c.Backend == "" {
|
|
|
|
inferenceModel, err = loader.GreedyLoader(opts...)
|
|
|
|
} else {
|
|
|
|
opts = append(opts, model.WithBackendString(c.Backend))
|
|
|
|
inferenceModel, err = loader.BackendLoader(opts...)
|
|
|
|
}
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
var fn func() ([]float32, error)
|
|
|
|
switch model := inferenceModel.(type) {
|
|
|
|
case *grpc.Client:
|
|
|
|
fn = func() ([]float32, error) {
|
|
|
|
predictOptions := gRPCPredictOpts(c, loader.ModelPath)
|
|
|
|
if len(tokens) > 0 {
|
|
|
|
embeds := []int32{}
|
|
|
|
|
|
|
|
for _, t := range tokens {
|
|
|
|
embeds = append(embeds, int32(t))
|
|
|
|
}
|
|
|
|
predictOptions.EmbeddingTokens = embeds
|
|
|
|
|
2023-07-14 23:19:43 +00:00
|
|
|
res, err := model.Embeddings(o.Context, predictOptions)
|
2023-07-14 23:19:43 +00:00
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
return res.Embeddings, nil
|
|
|
|
}
|
|
|
|
predictOptions.Embeddings = s
|
|
|
|
|
2023-07-14 23:19:43 +00:00
|
|
|
res, err := model.Embeddings(o.Context, predictOptions)
|
2023-07-14 23:19:43 +00:00
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
return res.Embeddings, nil
|
|
|
|
}
|
|
|
|
default:
|
|
|
|
fn = func() ([]float32, error) {
|
|
|
|
return nil, fmt.Errorf("embeddings not supported by the backend")
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return func() ([]float32, error) {
|
|
|
|
embeds, err := fn()
|
|
|
|
if err != nil {
|
|
|
|
return embeds, err
|
|
|
|
}
|
|
|
|
// Remove trailing 0s
|
|
|
|
for i := len(embeds) - 1; i >= 0; i-- {
|
|
|
|
if embeds[i] == 0.0 {
|
|
|
|
embeds = embeds[:i]
|
|
|
|
} else {
|
|
|
|
break
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return embeds, nil
|
|
|
|
}, nil
|
|
|
|
}
|