LocalAI/core/http/endpoints/openai/embeddings.go

package openai

import (
	"encoding/json"
	"fmt"
	"time"

	"github.com/go-skynet/LocalAI/core/backend"
	"github.com/go-skynet/LocalAI/core/config"
	"github.com/go-skynet/LocalAI/pkg/model"

	"github.com/go-skynet/LocalAI/core/schema"
	"github.com/google/uuid"

	"github.com/gofiber/fiber/v2"
	"github.com/rs/zerolog/log"
)

// EmbeddingsEndpoint is the OpenAI Embeddings API endpoint https://platform.openai.com/docs/api-reference/embeddings
//
// The returned handler reads the request, merges it with the backend
// configuration, and then computes one embedding for every entry of the
// merged configuration's InputToken list followed by one for every entry of
// its InputStrings list. Each item's Index is its position in the returned
// data list, so indexes stay unique even when a single request yields both
// tokenized and plain-string inputs. Any error from reading the request,
// resolving the embedding function, or running it is returned to the caller
// and no response body is written.
//
// @Summary Get a vector representation of a given input that can be easily consumed by machine learning models and algorithms.
// @Param request body schema.OpenAIRequest true "query params"
// @Success 200 {object} schema.OpenAIResponse "Response"
// @Router /v1/embeddings [post]
func EmbeddingsEndpoint(cl *config.BackendConfigLoader, ml *model.ModelLoader, appConfig *config.ApplicationConfig) func(c *fiber.Ctx) error {
	return func(c *fiber.Ctx) error {
		// Locals are deliberately not called "model"/"config" so they do not
		// shadow the imported packages of the same name.
		modelFile, input, err := readRequest(c, ml, appConfig, true)
		if err != nil {
			return fmt.Errorf("failed reading parameters from request:%w", err)
		}

		cfg, input, err := mergeRequestWithConfig(modelFile, input, cl, ml, appConfig.Debug, appConfig.Threads, appConfig.ContextSize, appConfig.F16)
		if err != nil {
			return fmt.Errorf("failed reading parameters from request:%w", err)
		}

		log.Debug().Msgf("Parameter Config: %+v", cfg)

		// Pre-sized for all inputs; stays a non-nil slice like the original literal.
		items := make([]schema.Item, 0, len(cfg.InputToken)+len(cfg.InputStrings))

		// embed resolves the model function for one input, runs it, and appends
		// the result. The index is taken from the number of items collected so
		// far so that tokenized and string inputs never share an index.
		embed := func(text string, tokens []int) error {
			embedFn, err := backend.ModelEmbedding(text, tokens, ml, *cfg, appConfig)
			if err != nil {
				return err
			}

			embeddings, err := embedFn()
			if err != nil {
				return err
			}

			idx := len(items)
			items = append(items, schema.Item{Embedding: embeddings, Index: idx, Object: "embedding"})
			return nil
		}

		// Tokenized inputs first, then plain strings (same order as before).
		for _, tokens := range cfg.InputToken {
			if err := embed("", tokens); err != nil {
				return err
			}
		}

		for _, text := range cfg.InputStrings {
			if err := embed(text, []int{}); err != nil {
				return err
			}
		}

		resp := &schema.OpenAIResponse{
			ID:      uuid.New().String(),
			Created: int(time.Now().Unix()),
			Model:   input.Model, // we have to return what the user sent here, due to OpenAI spec.
			Data:    items,
			Object:  "list",
		}

		// The marshalled copy is only used for debug logging; a failure here is
		// reported in the log and does not abort the request.
		if jsonResult, err := json.Marshal(resp); err != nil {
			log.Debug().Msgf("Response could not be marshalled for logging: %v", err)
		} else {
			log.Debug().Msgf("Response: %s", jsonResult)
		}

		// Return the prediction in the response body
		return c.JSON(resp)
	}
}
Revert "[Refactor]: Core/API Split" (#1550) Revert "[Refactor]: Core/API Split (#1506)" This reverts commit ab7b4d5ee9448e533a342bd1771393acd2967191. 2024-01-05 17:04:46 +00:00			`package openai`

			`import (`
			`"encoding/json"`
			`"fmt"`
			`"time"`

MQTT Startup Refactoring Part 1: core/ packages part 1 (#1728) This PR specifically introduces a `core` folder and moves the following packages over, without any other changes: - `api/backend` - `api/config` - `api/options` - `api/schema` Once this is merged and we confirm there's no regressions, I can migrate over the remaining changes piece by piece to split up application startup, backend services, http, and mqtt as was the goal of the earlier PRs! 2024-02-21 01:21:19 +00:00			`"github.com/go-skynet/LocalAI/core/backend"`
refactor: move remaining api packages to core (#1731) * core 1 * api/openai/files fix * core 2 - core/config * move over core api.go and tests to the start of core/http * move over localai specific endpoints to core/http, begin the service/endpoint split there * refactor big chunk on the plane * refactor chunk 2 on plane, next step: port and modify changes to request.go * easy fixes for request.go, major changes not done yet * lintfix * json tag lintfix? * gitignore and .keep files * strange fix attempt: rename the config dir? 2024-03-01 15:19:53 +00:00			`"github.com/go-skynet/LocalAI/core/config"`
			`"github.com/go-skynet/LocalAI/pkg/model"`

MQTT Startup Refactoring Part 1: core/ packages part 1 (#1728) This PR specifically introduces a `core` folder and moves the following packages over, without any other changes: - `api/backend` - `api/config` - `api/options` - `api/schema` Once this is merged and we confirm there's no regressions, I can migrate over the remaining changes piece by piece to split up application startup, backend services, http, and mqtt as was the goal of the earlier PRs! 2024-02-21 01:21:19 +00:00			`"github.com/go-skynet/LocalAI/core/schema"`
Revert "[Refactor]: Core/API Split" (#1550) Revert "[Refactor]: Core/API Split (#1506)" This reverts commit ab7b4d5ee9448e533a342bd1771393acd2967191. 2024-01-05 17:04:46 +00:00			`"github.com/google/uuid"`

			`"github.com/gofiber/fiber/v2"`
			`"github.com/rs/zerolog/log"`
			`)`

feat(swagger): Add swagger API doc (#1926) * makefile(build): add minimal and api build target * feat(swagger): Add swagger 2024-03-29 21:29:33 +00:00			`// EmbeddingsEndpoint is the OpenAI Embeddings API endpoint https://platform.openai.com/docs/api-reference/embeddings`
			`// @Summary Get a vector representation of a given input that can be easily consumed by machine learning models and algorithms.`
			`// @Param request body schema.OpenAIRequest true "query params"`
			`// @Success 200 {object} schema.OpenAIResponse "Response"`
			`// @Router /v1/embeddings [post]`
refactor: move remaining api packages to core (#1731) * core 1 * api/openai/files fix * core 2 - core/config * move over core api.go and tests to the start of core/http * move over localai specific endpoints to core/http, begin the service/endpoint split there * refactor big chunk on the plane * refactor chunk 2 on plane, next step: port and modify changes to request.go * easy fixes for request.go, major changes not done yet * lintfix * json tag lintfix? * gitignore and .keep files * strange fix attempt: rename the config dir? 2024-03-01 15:19:53 +00:00			`func EmbeddingsEndpoint(cl *config.BackendConfigLoader, ml *model.ModelLoader, appConfig *config.ApplicationConfig) func(c *fiber.Ctx) error {`
Revert "[Refactor]: Core/API Split" (#1550) Revert "[Refactor]: Core/API Split (#1506)" This reverts commit ab7b4d5ee9448e533a342bd1771393acd2967191. 2024-01-05 17:04:46 +00:00			`return func(c *fiber.Ctx) error {`
refactor: move remaining api packages to core (#1731) * core 1 * api/openai/files fix * core 2 - core/config * move over core api.go and tests to the start of core/http * move over localai specific endpoints to core/http, begin the service/endpoint split there * refactor big chunk on the plane * refactor chunk 2 on plane, next step: port and modify changes to request.go * easy fixes for request.go, major changes not done yet * lintfix * json tag lintfix? * gitignore and .keep files * strange fix attempt: rename the config dir? 2024-03-01 15:19:53 +00:00			`model, input, err := readRequest(c, ml, appConfig, true)`
Revert "[Refactor]: Core/API Split" (#1550) Revert "[Refactor]: Core/API Split (#1506)" This reverts commit ab7b4d5ee9448e533a342bd1771393acd2967191. 2024-01-05 17:04:46 +00:00			`if err != nil {`
			`return fmt.Errorf("failed reading parameters from request:%w", err)`
			`}`

refactor: move remaining api packages to core (#1731) * core 1 * api/openai/files fix * core 2 - core/config * move over core api.go and tests to the start of core/http * move over localai specific endpoints to core/http, begin the service/endpoint split there * refactor big chunk on the plane * refactor chunk 2 on plane, next step: port and modify changes to request.go * easy fixes for request.go, major changes not done yet * lintfix * json tag lintfix? * gitignore and .keep files * strange fix attempt: rename the config dir? 2024-03-01 15:19:53 +00:00			`config, input, err := mergeRequestWithConfig(model, input, cl, ml, appConfig.Debug, appConfig.Threads, appConfig.ContextSize, appConfig.F16)`
Revert "[Refactor]: Core/API Split" (#1550) Revert "[Refactor]: Core/API Split (#1506)" This reverts commit ab7b4d5ee9448e533a342bd1771393acd2967191. 2024-01-05 17:04:46 +00:00			`if err != nil {`
			`return fmt.Errorf("failed reading parameters from request:%w", err)`
			`}`

			`log.Debug().Msgf("Parameter Config: %+v", config)`
			`items := []schema.Item{}`

			`for i, s := range config.InputToken {`
			`// get the model function to call for the result`
refactor: move remaining api packages to core (#1731) * core 1 * api/openai/files fix * core 2 - core/config * move over core api.go and tests to the start of core/http * move over localai specific endpoints to core/http, begin the service/endpoint split there * refactor big chunk on the plane * refactor chunk 2 on plane, next step: port and modify changes to request.go * easy fixes for request.go, major changes not done yet * lintfix * json tag lintfix? * gitignore and .keep files * strange fix attempt: rename the config dir? 2024-03-01 15:19:53 +00:00			`embedFn, err := backend.ModelEmbedding("", s, ml, *config, appConfig)`
Revert "[Refactor]: Core/API Split" (#1550) Revert "[Refactor]: Core/API Split (#1506)" This reverts commit ab7b4d5ee9448e533a342bd1771393acd2967191. 2024-01-05 17:04:46 +00:00			`if err != nil {`
			`return err`
			`}`

			`embeddings, err := embedFn()`
			`if err != nil {`
			`return err`
			`}`
			`items = append(items, schema.Item{Embedding: embeddings, Index: i, Object: "embedding"})`
			`}`

			`for i, s := range config.InputStrings {`
			`// get the model function to call for the result`
refactor: move remaining api packages to core (#1731) * core 1 * api/openai/files fix * core 2 - core/config * move over core api.go and tests to the start of core/http * move over localai specific endpoints to core/http, begin the service/endpoint split there * refactor big chunk on the plane * refactor chunk 2 on plane, next step: port and modify changes to request.go * easy fixes for request.go, major changes not done yet * lintfix * json tag lintfix? * gitignore and .keep files * strange fix attempt: rename the config dir? 2024-03-01 15:19:53 +00:00			`embedFn, err := backend.ModelEmbedding(s, []int{}, ml, *config, appConfig)`
Revert "[Refactor]: Core/API Split" (#1550) Revert "[Refactor]: Core/API Split (#1506)" This reverts commit ab7b4d5ee9448e533a342bd1771393acd2967191. 2024-01-05 17:04:46 +00:00			`if err != nil {`
			`return err`
			`}`

			`embeddings, err := embedFn()`
			`if err != nil {`
			`return err`
			`}`
			`items = append(items, schema.Item{Embedding: embeddings, Index: i, Object: "embedding"})`
			`}`

			`id := uuid.New().String()`
			`created := int(time.Now().Unix())`
			`resp := &schema.OpenAIResponse{`
			`ID: id,`
			`Created: created,`
			`Model: input.Model, // we have to return what the user sent here, due to OpenAI spec.`
			`Data: items,`
			`Object: "list",`
			`}`

			`jsonResult, _ := json.Marshal(resp)`
			`log.Debug().Msgf("Response: %s", jsonResult)`

			`// Return the prediction in the response body`
			`return c.JSON(resp)`
			`}`
			`}`