You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
72 lines
1.7 KiB
72 lines
1.7 KiB
2 years ago
|
package rwkv
|
||
|
|
||
|
// This is a wrapper to statisfy the GRPC service interface
|
||
|
// It is meant to be used by the main executable that is the server for the specific backend type (falcon, gpt3, etc)
|
||
|
import (
|
||
|
"fmt"
|
||
|
"path/filepath"
|
||
|
|
||
|
"github.com/donomii/go-rwkv.cpp"
|
||
|
"github.com/go-skynet/LocalAI/pkg/grpc/base"
|
||
|
pb "github.com/go-skynet/LocalAI/pkg/grpc/proto"
|
||
|
)
|
||
|
|
||
|
const tokenizerSuffix = ".tokenizer.json"
|
||
|
|
||
|
type LLM struct {
|
||
|
base.Base
|
||
|
|
||
|
rwkv *rwkv.RwkvState
|
||
|
}
|
||
|
|
||
|
func (llm *LLM) Load(opts *pb.ModelOptions) error {
|
||
|
modelPath := filepath.Dir(opts.Model)
|
||
|
modelFile := filepath.Base(opts.Model)
|
||
|
model := rwkv.LoadFiles(opts.Model, filepath.Join(modelPath, modelFile+tokenizerSuffix), uint32(opts.GetThreads()))
|
||
|
|
||
|
if model == nil {
|
||
|
return fmt.Errorf("could not load model")
|
||
|
}
|
||
|
llm.rwkv = model
|
||
|
return nil
|
||
|
}
|
||
|
|
||
|
func (llm *LLM) Predict(opts *pb.PredictOptions) (string, error) {
|
||
|
|
||
|
stopWord := "\n"
|
||
|
if len(opts.StopPrompts) > 0 {
|
||
|
stopWord = opts.StopPrompts[0]
|
||
|
}
|
||
|
|
||
|
if err := llm.rwkv.ProcessInput(opts.Prompt); err != nil {
|
||
|
return "", err
|
||
|
}
|
||
|
|
||
|
response := llm.rwkv.GenerateResponse(int(opts.Tokens), stopWord, float32(opts.Temperature), float32(opts.TopP), nil)
|
||
|
|
||
|
return response, nil
|
||
|
}
|
||
|
|
||
|
func (llm *LLM) PredictStream(opts *pb.PredictOptions, results chan string) error {
|
||
|
go func() {
|
||
|
|
||
|
stopWord := "\n"
|
||
|
if len(opts.StopPrompts) > 0 {
|
||
|
stopWord = opts.StopPrompts[0]
|
||
|
}
|
||
|
|
||
|
if err := llm.rwkv.ProcessInput(opts.Prompt); err != nil {
|
||
|
fmt.Println("Error processing input: ", err)
|
||
|
return
|
||
|
}
|
||
|
|
||
|
llm.rwkv.GenerateResponse(int(opts.Tokens), stopWord, float32(opts.Temperature), float32(opts.TopP), func(s string) bool {
|
||
|
results <- s
|
||
|
return true
|
||
|
})
|
||
|
close(results)
|
||
|
}()
|
||
|
|
||
|
return nil
|
||
|
}
|