You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
60 lines
1.4 KiB
60 lines
1.4 KiB
1 year ago
|
package bloomz
|
||
|
|
||
|
// This is a wrapper to statisfy the GRPC service interface
|
||
|
// It is meant to be used by the main executable that is the server for the specific backend type (falcon, gpt3, etc)
|
||
|
import (
|
||
|
"fmt"
|
||
|
|
||
|
"github.com/go-skynet/LocalAI/pkg/grpc/base"
|
||
|
pb "github.com/go-skynet/LocalAI/pkg/grpc/proto"
|
||
|
|
||
|
"github.com/go-skynet/bloomz.cpp"
|
||
|
)
|
||
|
|
||
|
type LLM struct {
|
||
|
base.Base
|
||
|
|
||
|
bloomz *bloomz.Bloomz
|
||
|
}
|
||
|
|
||
|
func (llm *LLM) Load(opts *pb.ModelOptions) error {
|
||
|
model, err := bloomz.New(opts.Model)
|
||
|
llm.bloomz = model
|
||
|
return err
|
||
|
}
|
||
|
|
||
|
func buildPredictOptions(opts *pb.PredictOptions) []bloomz.PredictOption {
|
||
|
predictOptions := []bloomz.PredictOption{
|
||
|
bloomz.SetTemperature(float64(opts.Temperature)),
|
||
|
bloomz.SetTopP(float64(opts.TopP)),
|
||
|
bloomz.SetTopK(int(opts.TopK)),
|
||
|
bloomz.SetTokens(int(opts.Tokens)),
|
||
|
bloomz.SetThreads(int(opts.Threads)),
|
||
|
}
|
||
|
|
||
|
if opts.Seed != 0 {
|
||
|
predictOptions = append(predictOptions, bloomz.SetSeed(int(opts.Seed)))
|
||
|
}
|
||
|
|
||
|
return predictOptions
|
||
|
}
|
||
|
|
||
|
func (llm *LLM) Predict(opts *pb.PredictOptions) (string, error) {
|
||
|
return llm.bloomz.Predict(opts.Prompt, buildPredictOptions(opts)...)
|
||
|
}
|
||
|
|
||
|
// fallback to Predict
|
||
|
func (llm *LLM) PredictStream(opts *pb.PredictOptions, results chan string) error {
|
||
|
go func() {
|
||
|
res, err := llm.bloomz.Predict(opts.Prompt, buildPredictOptions(opts)...)
|
||
|
|
||
|
if err != nil {
|
||
|
fmt.Println("err: ", err)
|
||
|
}
|
||
|
results <- res
|
||
|
close(results)
|
||
|
}()
|
||
|
|
||
|
return nil
|
||
|
}
|