LocalAI/core/backend/transcript.go

package backend

import (
	"context"
	"fmt"

	"github.com/go-skynet/LocalAI/core/config"
	"github.com/go-skynet/LocalAI/core/schema"

	"github.com/go-skynet/LocalAI/pkg/concurrency"
	"github.com/go-skynet/LocalAI/pkg/grpc/proto"
	"github.com/go-skynet/LocalAI/pkg/model"
)

// TranscriptionBackendService bundles the dependencies needed to serve audio
// transcription requests: a model loader, a backend configuration loader and
// the application configuration.
type TranscriptionBackendService struct {
	// ml is handed to modelTranscription, which uses it to load the backend.
	ml        *model.ModelLoader
	// bcl resolves the backend configuration for an incoming request.
	bcl       *config.BackendConfigLoader
	// appConfig is passed along to both configuration resolution and model loading.
	appConfig *config.ApplicationConfig
}

// NewTranscriptionBackendService returns a TranscriptionBackendService that
// keeps references to the given model loader, backend configuration loader and
// application configuration. The arguments are stored as-is; nothing is copied
// or validated here.
func NewTranscriptionBackendService(ml *model.ModelLoader, bcl *config.BackendConfigLoader, appConfig *config.ApplicationConfig) *TranscriptionBackendService {
	svc := new(TranscriptionBackendService)
	svc.ml = ml
	svc.bcl = bcl
	svc.appConfig = appConfig
	return svc
}

// Transcribe runs the transcription described by request on a background
// goroutine and returns a receive-only channel for the outcome.
//
// The channel delivers exactly one ErrorOr value and is then closed: Error is
// set when the request is nil, when the backend configuration cannot be
// resolved, or when the transcription itself fails; otherwise Value holds the
// transcription result.
func (tbs *TranscriptionBackendService) Transcribe(request *schema.OpenAIRequest) <-chan concurrency.ErrorOr[*schema.TranscriptionResult] {
	// Exactly one value is ever sent, so a buffer of one lets the worker
	// deliver its result and exit even if the caller has stopped receiving.
	// With an unbuffered channel the goroutine would block forever in that case.
	responseChannel := make(chan concurrency.ErrorOr[*schema.TranscriptionResult], 1)
	go func(request *schema.OpenAIRequest) {
		// Close on every exit path so a receiver is always released.
		defer close(responseChannel)

		// A nil request would panic on request.Model below; a panic inside
		// this goroutine cannot be recovered by the caller, so report it as
		// an ordinary error instead.
		if request == nil {
			responseChannel <- concurrency.ErrorOr[*schema.TranscriptionResult]{Error: fmt.Errorf("transcription request is nil")}
			return
		}

		// The loader returns the request to use from here on along with the
		// resolved backend configuration.
		bc, request, err := tbs.bcl.LoadBackendConfigForModelAndOpenAIRequest(request.Model, request, tbs.appConfig)
		if err != nil {
			responseChannel <- concurrency.ErrorOr[*schema.TranscriptionResult]{Error: fmt.Errorf("failed reading parameters from request:%w", err)}
			return
		}

		tr, err := modelTranscription(request.File, request.Language, tbs.ml, bc, tbs.appConfig)
		if err != nil {
			responseChannel <- concurrency.ErrorOr[*schema.TranscriptionResult]{Error: err}
			return
		}
		responseChannel <- concurrency.ErrorOr[*schema.TranscriptionResult]{Value: tr}
	}(request)
	return responseChannel
}

// modelTranscription loads the whisper backend through ml and asks it to
// transcribe audio in the given language.
//
// audio is forwarded as the Dst field of the transcription request and
// language as its Language field. The thread count is read from
// backendConfig.Threads, which must be non-nil. An error is returned when the
// backend fails to load, when the loader yields a nil backend, or when the
// transcription call itself fails.
func modelTranscription(audio, language string, ml *model.ModelLoader, backendConfig *config.BackendConfig, appConfig *config.ApplicationConfig) (*schema.TranscriptionResult, error) {
	// Options specific to this call; modelOpts receives them together with
	// both configurations and produces the final option list for the loader.
	whisperOpts := []model.Option{
		model.WithBackendString(model.WhisperBackend),
		model.WithModel(backendConfig.Model),
		model.WithContext(appConfig.Context),
		model.WithThreads(uint32(*backendConfig.Threads)),
		model.WithAssetDir(appConfig.AssetsDestination),
	}

	backend, loadErr := ml.BackendLoader(modelOpts(backendConfig, appConfig, whisperOpts)...)
	switch {
	case loadErr != nil:
		return nil, loadErr
	case backend == nil:
		return nil, fmt.Errorf("could not load whisper model")
	}

	transcriptReq := &proto.TranscriptRequest{
		Dst:      audio,
		Language: language,
		Threads:  uint32(*backendConfig.Threads),
	}
	return backend.AudioTranscription(context.Background(), transcriptReq)
}
Revert "[Refactor]: Core/API Split" (#1550) Revert "[Refactor]: Core/API Split (#1506)" This reverts commit ab7b4d5ee9448e533a342bd1771393acd2967191. 2024-01-05 17:04:46 +00:00			`package backend`

			`import (`
			`"context"`
			`"fmt"`

refactor: move remaining api packages to core (#1731) * core 1 * api/openai/files fix * core 2 - core/config * move over core api.go and tests to the start of core/http * move over localai specific endpoints to core/http, begin the service/endpoint split there * refactor big chunk on the plane * refactor chunk 2 on plane, next step: port and modify changes to request.go * easy fixes for request.go, major changes not done yet * lintfix * json tag lintfix? * gitignore and .keep files * strange fix attempt: rename the config dir? 2024-03-01 15:19:53 +00:00			`"github.com/go-skynet/LocalAI/core/config"`
MQTT Startup Refactoring Part 1: core/ packages part 1 (#1728) This PR specifically introduces a `core` folder and moves the following packages over, without any other changes: - `api/backend` - `api/config` - `api/options` - `api/schema` Once this is merged and we confirm there's no regressions, I can migrate over the remaining changes piece by piece to split up application startup, backend services, http, and mqtt as was the goal of the earlier PRs! 2024-02-21 01:21:19 +00:00			`"github.com/go-skynet/LocalAI/core/schema"`
Revert "[Refactor]: Core/API Split" (#1550) Revert "[Refactor]: Core/API Split (#1506)" This reverts commit ab7b4d5ee9448e533a342bd1771393acd2967191. 2024-01-05 17:04:46 +00:00
refactor: backend/service split, channel-based llm flow (#1963) Refactor: channel based llm flow and services split --------- Signed-off-by: Dave Lee <dave@gray101.com> 2024-04-13 07:45:34 +00:00			`"github.com/go-skynet/LocalAI/pkg/concurrency"`
Revert "[Refactor]: Core/API Split" (#1550) Revert "[Refactor]: Core/API Split (#1506)" This reverts commit ab7b4d5ee9448e533a342bd1771393acd2967191. 2024-01-05 17:04:46 +00:00			`"github.com/go-skynet/LocalAI/pkg/grpc/proto"`
refactor: backend/service split, channel-based llm flow (#1963) Refactor: channel based llm flow and services split --------- Signed-off-by: Dave Lee <dave@gray101.com> 2024-04-13 07:45:34 +00:00			`"github.com/go-skynet/LocalAI/pkg/model"`
Revert "[Refactor]: Core/API Split" (#1550) Revert "[Refactor]: Core/API Split (#1506)" This reverts commit ab7b4d5ee9448e533a342bd1771393acd2967191. 2024-01-05 17:04:46 +00:00			`)`

refactor: backend/service split, channel-based llm flow (#1963) Refactor: channel based llm flow and services split --------- Signed-off-by: Dave Lee <dave@gray101.com> 2024-04-13 07:45:34 +00:00			`type TranscriptionBackendService struct {`
			`ml *model.ModelLoader`
			`bcl *config.BackendConfigLoader`
			`appConfig *config.ApplicationConfig`
			`}`

			`func NewTranscriptionBackendService(ml model.ModelLoader, bcl config.BackendConfigLoader, appConfig config.ApplicationConfig) TranscriptionBackendService {`
			`return &TranscriptionBackendService{`
			`ml: ml,`
			`bcl: bcl,`
			`appConfig: appConfig,`
			`}`
			`}`

			`func (tbs TranscriptionBackendService) Transcribe(request schema.OpenAIRequest) <-chan concurrency.ErrorOr[*schema.TranscriptionResult] {`
			`responseChannel := make(chan concurrency.ErrorOr[*schema.TranscriptionResult])`
			`go func(request *schema.OpenAIRequest) {`
			`bc, request, err := tbs.bcl.LoadBackendConfigForModelAndOpenAIRequest(request.Model, request, tbs.appConfig)`
			`if err != nil {`
			`responseChannel <- concurrency.ErrorOr[*schema.TranscriptionResult]{Error: fmt.Errorf("failed reading parameters from request:%w", err)}`
			`close(responseChannel)`
			`return`
			`}`

			`tr, err := modelTranscription(request.File, request.Language, tbs.ml, bc, tbs.appConfig)`
			`if err != nil {`
			`responseChannel <- concurrency.ErrorOr[*schema.TranscriptionResult]{Error: err}`
			`close(responseChannel)`
			`return`
			`}`
			`responseChannel <- concurrency.ErrorOr[*schema.TranscriptionResult]{Value: tr}`
			`close(responseChannel)`
			`}(request)`
			`return responseChannel`
			`}`

			`func modelTranscription(audio, language string, ml model.ModelLoader, backendConfig config.BackendConfig, appConfig config.ApplicationConfig) (schema.TranscriptionResult, error) {`
Revert "[Refactor]: Core/API Split" (#1550) Revert "[Refactor]: Core/API Split (#1506)" This reverts commit ab7b4d5ee9448e533a342bd1771393acd2967191. 2024-01-05 17:04:46 +00:00
refactor: move remaining api packages to core (#1731) * core 1 * api/openai/files fix * core 2 - core/config * move over core api.go and tests to the start of core/http * move over localai specific endpoints to core/http, begin the service/endpoint split there * refactor big chunk on the plane * refactor chunk 2 on plane, next step: port and modify changes to request.go * easy fixes for request.go, major changes not done yet * lintfix * json tag lintfix? * gitignore and .keep files * strange fix attempt: rename the config dir? 2024-03-01 15:19:53 +00:00			`opts := modelOpts(backendConfig, appConfig, []model.Option{`
Revert "[Refactor]: Core/API Split" (#1550) Revert "[Refactor]: Core/API Split (#1506)" This reverts commit ab7b4d5ee9448e533a342bd1771393acd2967191. 2024-01-05 17:04:46 +00:00			`model.WithBackendString(model.WhisperBackend),`
refactor: move remaining api packages to core (#1731) * core 1 * api/openai/files fix * core 2 - core/config * move over core api.go and tests to the start of core/http * move over localai specific endpoints to core/http, begin the service/endpoint split there * refactor big chunk on the plane * refactor chunk 2 on plane, next step: port and modify changes to request.go * easy fixes for request.go, major changes not done yet * lintfix * json tag lintfix? * gitignore and .keep files * strange fix attempt: rename the config dir? 2024-03-01 15:19:53 +00:00			`model.WithModel(backendConfig.Model),`
			`model.WithContext(appConfig.Context),`
fix(config): set better defaults for inferencing (#1822) * fix(defaults): set better defaults for inferencing This changeset aim to have better defaults and to properly detect when no inference settings are provided with the model. If not specified, we defaults to mirostat sampling, and offload all the GPU layers (if a GPU is detected). Related to https://github.com/mudler/LocalAI/issues/1373 and https://github.com/mudler/LocalAI/issues/1723 * Adapt tests * Also pre-initialize default seed 2024-03-13 09:05:30 +00:00			`model.WithThreads(uint32(*backendConfig.Threads)),`
refactor: move remaining api packages to core (#1731) * core 1 * api/openai/files fix * core 2 - core/config * move over core api.go and tests to the start of core/http * move over localai specific endpoints to core/http, begin the service/endpoint split there * refactor big chunk on the plane * refactor chunk 2 on plane, next step: port and modify changes to request.go * easy fixes for request.go, major changes not done yet * lintfix * json tag lintfix? * gitignore and .keep files * strange fix attempt: rename the config dir? 2024-03-01 15:19:53 +00:00			`model.WithAssetDir(appConfig.AssetsDestination),`
Revert "[Refactor]: Core/API Split" (#1550) Revert "[Refactor]: Core/API Split (#1506)" This reverts commit ab7b4d5ee9448e533a342bd1771393acd2967191. 2024-01-05 17:04:46 +00:00			`})`

refactor: move remaining api packages to core (#1731) * core 1 * api/openai/files fix * core 2 - core/config * move over core api.go and tests to the start of core/http * move over localai specific endpoints to core/http, begin the service/endpoint split there * refactor big chunk on the plane * refactor chunk 2 on plane, next step: port and modify changes to request.go * easy fixes for request.go, major changes not done yet * lintfix * json tag lintfix? * gitignore and .keep files * strange fix attempt: rename the config dir? 2024-03-01 15:19:53 +00:00			`whisperModel, err := ml.BackendLoader(opts...)`
Revert "[Refactor]: Core/API Split" (#1550) Revert "[Refactor]: Core/API Split (#1506)" This reverts commit ab7b4d5ee9448e533a342bd1771393acd2967191. 2024-01-05 17:04:46 +00:00			`if err != nil {`
			`return nil, err`
			`}`

			`if whisperModel == nil {`
			`return nil, fmt.Errorf("could not load whisper model")`
			`}`

			`return whisperModel.AudioTranscription(context.Background(), &proto.TranscriptRequest{`
			`Dst: audio,`
			`Language: language,`
fix(config): set better defaults for inferencing (#1822) * fix(defaults): set better defaults for inferencing This changeset aim to have better defaults and to properly detect when no inference settings are provided with the model. If not specified, we defaults to mirostat sampling, and offload all the GPU layers (if a GPU is detected). Related to https://github.com/mudler/LocalAI/issues/1373 and https://github.com/mudler/LocalAI/issues/1723 * Adapt tests * Also pre-initialize default seed 2024-03-13 09:05:30 +00:00			`Threads: uint32(*backendConfig.Threads),`
Revert "[Refactor]: Core/API Split" (#1550) Revert "[Refactor]: Core/API Split (#1506)" This reverts commit ab7b4d5ee9448e533a342bd1771393acd2967191. 2024-01-05 17:04:46 +00:00			`})`
			`}`