LocalAI/api.go

package main

import (
	"embed"
	"net/http"
	"strconv"

	llama "github.com/go-skynet/llama/go"
	"github.com/gofiber/fiber/v2"
	"github.com/gofiber/fiber/v2/middleware/filesystem"
)

//go:embed index.html
var indexHTML embed.FS

func api(l *llama.LLama, listenAddr string, threads int) error {
	app := fiber.New()
	app.Use("/", filesystem.New(filesystem.Config{
		Root:         http.FS(indexHTML),
		NotFoundFile: "index.html",
	}))
	/*
		curl --location --request POST 'http://localhost:8080/predict' --header 'Content-Type: application/json' --data-raw '{
		    "text": "What is an alpaca?",
		    "topP": 0.8,
		    "topK": 50,
		    "temperature": 0.7,
		    "tokens": 100
		}'
	*/

	// Endpoint to generate the prediction
	app.Post("/predict", func(c *fiber.Ctx) error {
		// Get input data from the request body
		input := new(struct {
			Text string `json:"text"`
		})
		if err := c.BodyParser(input); err != nil {
			return err
		}

		// Set the parameters for the language model prediction
		topP, err := strconv.ParseFloat(c.Query("topP", "0.9"), 64) // Default value of topP is 0.9
		if err != nil {
			return err
		}

		topK, err := strconv.Atoi(c.Query("topK", "40")) // Default value of topK is 40
		if err != nil {
			return err
		}

		temperature, err := strconv.ParseFloat(c.Query("temperature", "0.5"), 64) // Default value of temperature is 0.5
		if err != nil {
			return err
		}

		tokens, err := strconv.Atoi(c.Query("tokens", "128")) // Default value of tokens is 128
		if err != nil {
			return err
		}

		// Generate the prediction using the language model
		prediction, err := l.Predict(
			input.Text,
			llama.SetTemperature(temperature),
			llama.SetTopP(topP),
			llama.SetTopK(topK),
			llama.SetTokens(tokens),
			llama.SetThreads(threads),
		)
		if err != nil {
			return err
		}

		// Return the prediction in the response body
		return c.JSON(struct {
			Prediction string `json:"prediction"`
		}{
			Prediction: prediction,
		})
	})

	// Start the server
	app.Listen(":8080")
	return nil
}
First import 2023-03-18 22:59:06 +00:00			`package main`

			`import (`
Add a simple web-page as index of the API for helping with inference testing 2023-03-25 00:09:51 +00:00			`"embed"`
			`"net/http"`
First import 2023-03-18 22:59:06 +00:00			`"strconv"`

			`llama "github.com/go-skynet/llama/go"`
			`"github.com/gofiber/fiber/v2"`
Add a simple web-page as index of the API for helping with inference testing 2023-03-25 00:09:51 +00:00			`"github.com/gofiber/fiber/v2/middleware/filesystem"`
First import 2023-03-18 22:59:06 +00:00			`)`

Add a simple web-page as index of the API for helping with inference testing 2023-03-25 00:09:51 +00:00			`//go:embed index.html`
			`var indexHTML embed.FS`

Update llama-go, allow to set context-size and enable alpaca model by default 2023-03-21 18:20:23 +00:00			`func api(l *llama.LLama, listenAddr string, threads int) error {`
First import 2023-03-18 22:59:06 +00:00			`app := fiber.New()`
Add a simple web-page as index of the API for helping with inference testing 2023-03-25 00:09:51 +00:00			`app.Use("/", filesystem.New(filesystem.Config{`
			`Root: http.FS(indexHTML),`
			`NotFoundFile: "index.html",`
			`}))`
First import 2023-03-18 22:59:06 +00:00			`/*`
			`curl --location --request POST 'http://localhost:8080/predict' --header 'Content-Type: application/json' --data-raw '{`
			`"text": "What is an alpaca?",`
			`"topP": 0.8,`
			`"topK": 50,`
			`"temperature": 0.7,`
			`"tokens": 100`
			`}'`
			`*/`

			`// Endpoint to generate the prediction`
			`app.Post("/predict", func(c *fiber.Ctx) error {`
			`// Get input data from the request body`
			`input := new(struct {`
			Text string `json:"text"`
			`})`
			`if err := c.BodyParser(input); err != nil {`
			`return err`
			`}`

			`// Set the parameters for the language model prediction`
			`topP, err := strconv.ParseFloat(c.Query("topP", "0.9"), 64) // Default value of topP is 0.9`
			`if err != nil {`
			`return err`
			`}`

			`topK, err := strconv.Atoi(c.Query("topK", "40")) // Default value of topK is 40`
			`if err != nil {`
			`return err`
			`}`

			`temperature, err := strconv.ParseFloat(c.Query("temperature", "0.5"), 64) // Default value of temperature is 0.5`
			`if err != nil {`
			`return err`
			`}`

			`tokens, err := strconv.Atoi(c.Query("tokens", "128")) // Default value of tokens is 128`
			`if err != nil {`
			`return err`
			`}`

			`// Generate the prediction using the language model`
			`prediction, err := l.Predict(`
			`input.Text,`
			`llama.SetTemperature(temperature),`
			`llama.SetTopP(topP),`
			`llama.SetTopK(topK),`
			`llama.SetTokens(tokens),`
			`llama.SetThreads(threads),`
			`)`
			`if err != nil {`
			`return err`
			`}`

			`// Return the prediction in the response body`
			`return c.JSON(struct {`
			Prediction string `json:"prediction"`
			`}{`
			`Prediction: prediction,`
			`})`
			`})`

			`// Start the server`
			`app.Listen(":8080")`
			`return nil`
			`}`