mirror of
https://github.com/mudler/LocalAI.git
synced 2024-06-07 19:40:48 +00:00
fdd95d1d86
* feat: allow to run parallel requests Signed-off-by: Ettore Di Giacinto <mudler@localai.io> * fixup Signed-off-by: Ettore Di Giacinto <mudler@localai.io> --------- Signed-off-by: Ettore Di Giacinto <mudler@localai.io>
119 lines
2.8 KiB
Go
119 lines
2.8 KiB
Go
package model
|
|
|
|
import (
|
|
"fmt"
|
|
"os"
|
|
"os/signal"
|
|
"strconv"
|
|
"strings"
|
|
"syscall"
|
|
"time"
|
|
|
|
"github.com/hpcloud/tail"
|
|
process "github.com/mudler/go-processmanager"
|
|
"github.com/rs/zerolog/log"
|
|
)
|
|
|
|
func (ml *ModelLoader) StopAllExcept(s string) {
|
|
ml.StopGRPC(func(id string, p *process.Process) bool {
|
|
if id != s {
|
|
for ml.models[id].GRPC().IsBusy() {
|
|
log.Debug().Msgf("%s busy. Waiting.", id)
|
|
time.Sleep(2 * time.Second)
|
|
}
|
|
log.Debug().Msgf("[single-backend] Stopping %s", id)
|
|
return true
|
|
}
|
|
return false
|
|
})
|
|
}
|
|
|
|
func (ml *ModelLoader) deleteProcess(s string) error {
|
|
if err := ml.grpcProcesses[s].Stop(); err != nil {
|
|
return err
|
|
}
|
|
delete(ml.grpcProcesses, s)
|
|
delete(ml.models, s)
|
|
return nil
|
|
}
|
|
|
|
type GRPCProcessFilter = func(id string, p *process.Process) bool
|
|
|
|
func includeAllProcesses(_ string, _ *process.Process) bool {
|
|
return true
|
|
}
|
|
|
|
func (ml *ModelLoader) StopGRPC(filter GRPCProcessFilter) {
|
|
for k, p := range ml.grpcProcesses {
|
|
if filter(k, p) {
|
|
ml.deleteProcess(k)
|
|
}
|
|
}
|
|
}
|
|
|
|
func (ml *ModelLoader) StopAllGRPC() {
|
|
ml.StopGRPC(includeAllProcesses)
|
|
}
|
|
|
|
func (ml *ModelLoader) GetGRPCPID(id string) (int, error) {
|
|
p, exists := ml.grpcProcesses[id]
|
|
if !exists {
|
|
return -1, fmt.Errorf("no grpc backend found for %s", id)
|
|
}
|
|
return strconv.Atoi(p.PID)
|
|
}
|
|
|
|
func (ml *ModelLoader) startProcess(grpcProcess, id string, serverAddress string) error {
|
|
// Make sure the process is executable
|
|
if err := os.Chmod(grpcProcess, 0755); err != nil {
|
|
return err
|
|
}
|
|
|
|
log.Debug().Msgf("Loading GRPC Process: %s", grpcProcess)
|
|
|
|
log.Debug().Msgf("GRPC Service for %s will be running at: '%s'", id, serverAddress)
|
|
|
|
grpcControlProcess := process.New(
|
|
process.WithTemporaryStateDir(),
|
|
process.WithName(grpcProcess),
|
|
process.WithArgs("--addr", serverAddress),
|
|
process.WithEnvironment(os.Environ()...),
|
|
)
|
|
|
|
ml.grpcProcesses[id] = grpcControlProcess
|
|
|
|
if err := grpcControlProcess.Run(); err != nil {
|
|
return err
|
|
}
|
|
|
|
log.Debug().Msgf("GRPC Service state dir: %s", grpcControlProcess.StateDir())
|
|
// clean up process
|
|
go func() {
|
|
c := make(chan os.Signal, 1)
|
|
signal.Notify(c, os.Interrupt, syscall.SIGTERM)
|
|
<-c
|
|
grpcControlProcess.Stop()
|
|
}()
|
|
|
|
go func() {
|
|
t, err := tail.TailFile(grpcControlProcess.StderrPath(), tail.Config{Follow: true})
|
|
if err != nil {
|
|
log.Debug().Msgf("Could not tail stderr")
|
|
}
|
|
for line := range t.Lines {
|
|
log.Debug().Msgf("GRPC(%s): stderr %s", strings.Join([]string{id, serverAddress}, "-"), line.Text)
|
|
}
|
|
}()
|
|
go func() {
|
|
t, err := tail.TailFile(grpcControlProcess.StdoutPath(), tail.Config{Follow: true})
|
|
if err != nil {
|
|
log.Debug().Msgf("Could not tail stdout")
|
|
}
|
|
for line := range t.Lines {
|
|
log.Debug().Msgf("GRPC(%s): stdout %s", strings.Join([]string{id, serverAddress}, "-"), line.Text)
|
|
}
|
|
}()
|
|
|
|
return nil
|
|
}
|