LocalAI/pkg/grpc/llm/bert/bert.go

package bert

// This is a wrapper to satisfy the GRPC service interface
// It is meant to be used by the main executable that is the server for the specific backend type (falcon, gpt3, etc)
import (
	bert "github.com/go-skynet/go-bert.cpp"
	"github.com/rs/zerolog/log"

	"github.com/go-skynet/LocalAI/pkg/grpc/base"
	pb "github.com/go-skynet/LocalAI/pkg/grpc/proto"
)

// Embeddings is the bert backend type. It embeds base.Base (whose Lock, Unlock
// and State members are used by the methods below) and holds the go-bert.cpp
// model handle that the embedding calls are delegated to.
type Embeddings struct {
	base.Base
	// bert is the model handle assigned by Load.
	bert *bert.Bert
}

// Load creates the bert model from opts.ModelFile and stores it on the backend.
//
// A warning is logged when the backend is not in the UNINITIALIZED state at
// the time of the call; loading proceeds regardless. The Base lock is held for
// the duration of the load.
//
// On failure the error from bert.New is returned unchanged and the previously
// stored model handle (if any) is left untouched, so a failed reload does not
// replace a usable model with an invalid one.
func (llm *Embeddings) Load(opts *pb.ModelOptions) error {
	// NOTE(review): this check intentionally runs before Lock; keep it here
	// unless Base.Lock is confirmed not to modify State.
	if llm.Base.State != pb.StatusResponse_UNINITIALIZED {
		log.Warn().Msgf("bert backend loading %s while already in state %s!", opts.Model, llm.Base.State.String())
	}

	llm.Base.Lock()
	defer llm.Base.Unlock()

	model, err := bert.New(opts.ModelFile)
	if err != nil {
		// The returned model is meaningless on error; do not store it.
		return err
	}

	llm.bert = model
	return nil
}

// Embeddings computes an embedding vector for the request while holding the
// Base lock.
//
// When opts.EmbeddingTokens is non-empty the tokens are converted to []int and
// passed to TokenEmbeddings; otherwise the text in opts.Embeddings is passed to
// the model's Embeddings call. In both cases opts.Threads is forwarded through
// bert.SetThreads. The result and error of the underlying call are returned
// as-is.
func (llm *Embeddings) Embeddings(opts *pb.PredictOptions) ([]float32, error) {
	llm.Base.Lock()
	defer llm.Base.Unlock()

	threadOpt := bert.SetThreads(int(opts.Threads))

	// No pre-tokenized input: embed the raw text.
	if len(opts.EmbeddingTokens) == 0 {
		return llm.bert.Embeddings(opts.Embeddings, threadOpt)
	}

	// The model API takes []int, so widen each token id individually.
	ids := make([]int, len(opts.EmbeddingTokens))
	for i, tok := range opts.EmbeddingTokens {
		ids[i] = int(tok)
	}
	return llm.bert.TokenEmbeddings(ids, threadOpt)
}
feat: move other backends to grpc This finally makes everything more consistent Signed-off-by: Ettore Di Giacinto <mudler@localai.io> 2023-07-14 23:19:43 +00:00			`package bert`

			`// This is a wrapper to statisfy the GRPC service interface`
			`// It is meant to be used by the main executable that is the server for the specific backend type (falcon, gpt3, etc)`
			`import (`
			`bert "github.com/go-skynet/go-bert.cpp"`
Usage Features (#863) 2023-08-18 19:23:14 +00:00			`"github.com/rs/zerolog/log"`
feat: move other backends to grpc This finally makes everything more consistent Signed-off-by: Ettore Di Giacinto <mudler@localai.io> 2023-07-14 23:19:43 +00:00
			`"github.com/go-skynet/LocalAI/pkg/grpc/base"`
			`pb "github.com/go-skynet/LocalAI/pkg/grpc/proto"`
			`)`

			`type Embeddings struct {`
			`base.Base`
			`bert *bert.Bert`
			`}`

			`func (llm Embeddings) Load(opts pb.ModelOptions) error {`
Usage Features (#863) 2023-08-18 19:23:14 +00:00			`if llm.Base.State != pb.StatusResponse_UNINITIALIZED {`
			`log.Warn().Msgf("bert backend loading %s while already in state %s!", opts.Model, llm.Base.State.String())`
			`}`

			`llm.Base.Lock()`
			`defer llm.Base.Unlock()`
feat: add initial AutoGPTQ backend implementation 2023-08-07 20:39:10 +00:00			`model, err := bert.New(opts.ModelFile)`
feat: move other backends to grpc This finally makes everything more consistent Signed-off-by: Ettore Di Giacinto <mudler@localai.io> 2023-07-14 23:19:43 +00:00			`llm.bert = model`
			`return err`
			`}`

			`func (llm Embeddings) Embeddings(opts pb.PredictOptions) ([]float32, error) {`
Usage Features (#863) 2023-08-18 19:23:14 +00:00			`llm.Base.Lock()`
			`defer llm.Base.Unlock()`

feat: move other backends to grpc This finally makes everything more consistent Signed-off-by: Ettore Di Giacinto <mudler@localai.io> 2023-07-14 23:19:43 +00:00			`if len(opts.EmbeddingTokens) > 0 {`
			`tokens := []int{}`
			`for _, t := range opts.EmbeddingTokens {`
			`tokens = append(tokens, int(t))`
			`}`
			`return llm.bert.TokenEmbeddings(tokens, bert.SetThreads(int(opts.Threads)))`
			`}`

			`return llm.bert.Embeddings(opts.Embeddings, bert.SetThreads(int(opts.Threads)))`
			`}`