@ -431,20 +431,22 @@ type ModelOptions struct {
sizeCache protoimpl . SizeCache
unknownFields protoimpl . UnknownFields
Model string ` protobuf:"bytes,1,opt,name=Model,proto3" json:"Model,omitempty" `
ContextSize int32 ` protobuf:"varint,2,opt,name=ContextSize,proto3" json:"ContextSize,omitempty" `
Seed int32 ` protobuf:"varint,3,opt,name=Seed,proto3" json:"Seed,omitempty" `
NBatch int32 ` protobuf:"varint,4,opt,name=NBatch,proto3" json:"NBatch,omitempty" `
F16Memory bool ` protobuf:"varint,5,opt,name=F16Memory,proto3" json:"F16Memory,omitempty" `
MLock bool ` protobuf:"varint,6,opt,name=MLock,proto3" json:"MLock,omitempty" `
MMap bool ` protobuf:"varint,7,opt,name=MMap,proto3" json:"MMap,omitempty" `
VocabOnly bool ` protobuf:"varint,8,opt,name=VocabOnly,proto3" json:"VocabOnly,omitempty" `
LowVRAM bool ` protobuf:"varint,9,opt,name=LowVRAM,proto3" json:"LowVRAM,omitempty" `
Embeddings bool ` protobuf:"varint,10,opt,name=Embeddings,proto3" json:"Embeddings,omitempty" `
NUMA bool ` protobuf:"varint,11,opt,name=NUMA,proto3" json:"NUMA,omitempty" `
NGPULayers int32 ` protobuf:"varint,12,opt,name=NGPULayers,proto3" json:"NGPULayers,omitempty" `
MainGPU string ` protobuf:"bytes,13,opt,name=MainGPU,proto3" json:"MainGPU,omitempty" `
TensorSplit string ` protobuf:"bytes,14,opt,name=TensorSplit,proto3" json:"TensorSplit,omitempty" `
Model string ` protobuf:"bytes,1,opt,name=Model,proto3" json:"Model,omitempty" `
ContextSize int32 ` protobuf:"varint,2,opt,name=ContextSize,proto3" json:"ContextSize,omitempty" `
Seed int32 ` protobuf:"varint,3,opt,name=Seed,proto3" json:"Seed,omitempty" `
NBatch int32 ` protobuf:"varint,4,opt,name=NBatch,proto3" json:"NBatch,omitempty" `
F16Memory bool ` protobuf:"varint,5,opt,name=F16Memory,proto3" json:"F16Memory,omitempty" `
MLock bool ` protobuf:"varint,6,opt,name=MLock,proto3" json:"MLock,omitempty" `
MMap bool ` protobuf:"varint,7,opt,name=MMap,proto3" json:"MMap,omitempty" `
VocabOnly bool ` protobuf:"varint,8,opt,name=VocabOnly,proto3" json:"VocabOnly,omitempty" `
LowVRAM bool ` protobuf:"varint,9,opt,name=LowVRAM,proto3" json:"LowVRAM,omitempty" `
Embeddings bool ` protobuf:"varint,10,opt,name=Embeddings,proto3" json:"Embeddings,omitempty" `
NUMA bool ` protobuf:"varint,11,opt,name=NUMA,proto3" json:"NUMA,omitempty" `
NGPULayers int32 ` protobuf:"varint,12,opt,name=NGPULayers,proto3" json:"NGPULayers,omitempty" `
MainGPU string ` protobuf:"bytes,13,opt,name=MainGPU,proto3" json:"MainGPU,omitempty" `
TensorSplit string ` protobuf:"bytes,14,opt,name=TensorSplit,proto3" json:"TensorSplit,omitempty" `
Threads int32 ` protobuf:"varint,15,opt,name=Threads,proto3" json:"Threads,omitempty" `
LibrarySearchPath string ` protobuf:"bytes,16,opt,name=LibrarySearchPath,proto3" json:"LibrarySearchPath,omitempty" `
}
func ( x * ModelOptions ) Reset ( ) {
@ -577,6 +579,20 @@ func (x *ModelOptions) GetTensorSplit() string {
return ""
}
// GetThreads returns the Threads field of x.
// It is safe to call on a nil receiver, in which case it returns 0.
func (x *ModelOptions) GetThreads() int32 {
	if x == nil {
		return 0
	}
	return x.Threads
}
// GetLibrarySearchPath returns the LibrarySearchPath field of x.
// It is safe to call on a nil receiver, in which case it returns "".
func (x *ModelOptions) GetLibrarySearchPath() string {
	if x == nil {
		return ""
	}
	return x.LibrarySearchPath
}
type Result struct {
state protoimpl . MessageState
sizeCache protoimpl . SizeCache
@ -753,7 +769,7 @@ var file_pkg_grpc_proto_llmserver_proto_rawDesc = []byte{
0x65 , 0x64 , 0x64 , 0x69 , 0x6e , 0x67 , 0x73 , 0x18 , 0x24 , 0x20 , 0x01 , 0x28 , 0x09 , 0x52 , 0x0a , 0x45 ,
0x6d , 0x62 , 0x65 , 0x64 , 0x64 , 0x69 , 0x6e , 0x67 , 0x73 , 0x22 , 0x21 , 0x0a , 0x05 , 0x52 , 0x65 , 0x70 ,
0x6c , 0x79 , 0x12 , 0x18 , 0x0a , 0x07 , 0x6d , 0x65 , 0x73 , 0x73 , 0x61 , 0x67 , 0x65 , 0x18 , 0x01 , 0x20 ,
0x01 , 0x28 , 0x09 , 0x52 , 0x07 , 0x6d , 0x65 , 0x73 , 0x73 , 0x61 , 0x67 , 0x65 , 0x22 , 0x82 , 0x03 , 0x0a ,
0x01 , 0x28 , 0x09 , 0x52 , 0x07 , 0x6d , 0x65 , 0x73 , 0x73 , 0x61 , 0x67 , 0x65 , 0x22 , 0xca , 0x03 , 0x0a ,
0x0c , 0x4d , 0x6f , 0x64 , 0x65 , 0x6c , 0x4f , 0x70 , 0x74 , 0x69 , 0x6f , 0x6e , 0x73 , 0x12 , 0x14 , 0x0a ,
0x05 , 0x4d , 0x6f , 0x64 , 0x65 , 0x6c , 0x18 , 0x01 , 0x20 , 0x01 , 0x28 , 0x09 , 0x52 , 0x05 , 0x4d , 0x6f ,
0x64 , 0x65 , 0x6c , 0x12 , 0x20 , 0x0a , 0x0b , 0x43 , 0x6f , 0x6e , 0x74 , 0x65 , 0x78 , 0x74 , 0x53 , 0x69 ,
@ -778,36 +794,40 @@ var file_pkg_grpc_proto_llmserver_proto_rawDesc = []byte{
0x18 , 0x0d , 0x20 , 0x01 , 0x28 , 0x09 , 0x52 , 0x07 , 0x4d , 0x61 , 0x69 , 0x6e , 0x47 , 0x50 , 0x55 , 0x12 ,
0x20 , 0x0a , 0x0b , 0x54 , 0x65 , 0x6e , 0x73 , 0x6f , 0x72 , 0x53 , 0x70 , 0x6c , 0x69 , 0x74 , 0x18 , 0x0e ,
0x20 , 0x01 , 0x28 , 0x09 , 0x52 , 0x0b , 0x54 , 0x65 , 0x6e , 0x73 , 0x6f , 0x72 , 0x53 , 0x70 , 0x6c , 0x69 ,
0x74 , 0x22 , 0x3c , 0x0a , 0x06 , 0x52 , 0x65 , 0x73 , 0x75 , 0x6c , 0x74 , 0x12 , 0x18 , 0x0a , 0x07 , 0x6d ,
0x65 , 0x73 , 0x73 , 0x61 , 0x67 , 0x65 , 0x18 , 0x01 , 0x20 , 0x01 , 0x28 , 0x09 , 0x52 , 0x07 , 0x6d , 0x65 ,
0x73 , 0x73 , 0x61 , 0x67 , 0x65 , 0x12 , 0x18 , 0x0a , 0x07 , 0x73 , 0x75 , 0x63 , 0x63 , 0x65 , 0x73 , 0x73 ,
0x18 , 0x02 , 0x20 , 0x01 , 0x28 , 0x08 , 0x52 , 0x07 , 0x73 , 0x75 , 0x63 , 0x63 , 0x65 , 0x73 , 0x73 , 0x22 ,
0x31 , 0x0a , 0x0f , 0x45 , 0x6d , 0x62 , 0x65 , 0x64 , 0x64 , 0x69 , 0x6e , 0x67 , 0x52 , 0x65 , 0x73 , 0x75 ,
0x6c , 0x74 , 0x12 , 0x1e , 0x0a , 0x0a , 0x65 , 0x6d , 0x62 , 0x65 , 0x64 , 0x64 , 0x69 , 0x6e , 0x67 , 0x73 ,
0x18 , 0x01 , 0x20 , 0x03 , 0x28 , 0x02 , 0x52 , 0x0a , 0x65 , 0x6d , 0x62 , 0x65 , 0x64 , 0x64 , 0x69 , 0x6e ,
0x67 , 0x73 , 0x32 , 0xfe , 0x01 , 0x0a , 0x03 , 0x4c , 0x4c , 0x4d , 0x12 , 0x2a , 0x0a , 0x06 , 0x48 , 0x65 ,
0x61 , 0x6c , 0x74 , 0x68 , 0x12 , 0x12 , 0x2e , 0x6c , 0x6c , 0x6d , 0x2e , 0x48 , 0x65 , 0x61 , 0x6c , 0x74 ,
0x68 , 0x4d , 0x65 , 0x73 , 0x73 , 0x61 , 0x67 , 0x65 , 0x1a , 0x0a , 0x2e , 0x6c , 0x6c , 0x6d , 0x2e , 0x52 ,
0x65 , 0x70 , 0x6c , 0x79 , 0x22 , 0x00 , 0x12 , 0x2c , 0x0a , 0x07 , 0x50 , 0x72 , 0x65 , 0x64 , 0x69 , 0x63 ,
0x74 , 0x12 , 0x13 , 0x2e , 0x6c , 0x6c , 0x6d , 0x2e , 0x50 , 0x72 , 0x65 , 0x64 , 0x69 , 0x63 , 0x74 , 0x4f ,
0x70 , 0x74 , 0x69 , 0x6f , 0x6e , 0x73 , 0x1a , 0x0a , 0x2e , 0x6c , 0x6c , 0x6d , 0x2e , 0x52 , 0x65 , 0x70 ,
0x6c , 0x79 , 0x22 , 0x00 , 0x12 , 0x2d , 0x0a , 0x09 , 0x4c , 0x6f , 0x61 , 0x64 , 0x4d , 0x6f , 0x64 , 0x65 ,
0x6c , 0x12 , 0x11 , 0x2e , 0x6c , 0x6c , 0x6d , 0x2e , 0x4d , 0x6f , 0x64 , 0x65 , 0x6c , 0x4f , 0x70 , 0x74 ,
0x69 , 0x6f , 0x6e , 0x73 , 0x1a , 0x0b , 0x2e , 0x6c , 0x6c , 0x6d , 0x2e , 0x52 , 0x65 , 0x73 , 0x75 , 0x6c ,
0x74 , 0x22 , 0x00 , 0x12 , 0x34 , 0x0a , 0x0d , 0x50 , 0x72 , 0x65 , 0x64 , 0x69 , 0x63 , 0x74 , 0x53 , 0x74 ,
0x72 , 0x65 , 0x61 , 0x6d , 0x12 , 0x13 , 0x2e , 0x6c , 0x6c , 0x6d , 0x2e , 0x50 , 0x72 , 0x65 , 0x64 , 0x69 ,
0x63 , 0x74 , 0x4f , 0x70 , 0x74 , 0x69 , 0x6f , 0x6e , 0x73 , 0x1a , 0x0a , 0x2e , 0x6c , 0x6c , 0x6d , 0x2e ,
0x52 , 0x65 , 0x70 , 0x6c , 0x79 , 0x22 , 0x00 , 0x30 , 0x01 , 0x12 , 0x38 , 0x0a , 0x09 , 0x45 , 0x6d , 0x62 ,
0x65 , 0x64 , 0x64 , 0x69 , 0x6e , 0x67 , 0x12 , 0x13 , 0x2e , 0x6c , 0x6c , 0x6d , 0x2e , 0x50 , 0x72 , 0x65 ,
0x64 , 0x69 , 0x63 , 0x74 , 0x4f , 0x70 , 0x74 , 0x69 , 0x6f , 0x6e , 0x73 , 0x1a , 0x14 , 0x2e , 0x6c , 0x6c ,
0x6d , 0x2e , 0x45 , 0x6d , 0x62 , 0x65 , 0x64 , 0x64 , 0x69 , 0x6e , 0x67 , 0x52 , 0x65 , 0x73 , 0x75 , 0x6c ,
0x74 , 0x22 , 0x00 , 0x42 , 0x57 , 0x0a , 0x1b , 0x69 , 0x6f , 0x2e , 0x73 , 0x6b , 0x79 , 0x6e , 0x65 , 0x74 ,
0x2e , 0x6c , 0x6f , 0x63 , 0x61 , 0x6c , 0x61 , 0x69 , 0x2e , 0x6c , 0x6c , 0x6d , 0x73 , 0x65 , 0x72 , 0x76 ,
0x65 , 0x72 , 0x42 , 0x09 , 0x4c , 0x4c , 0x4d , 0x53 , 0x65 , 0x72 , 0x76 , 0x65 , 0x72 , 0x50 , 0x01 , 0x5a ,
0x2b , 0x67 , 0x69 , 0x74 , 0x68 , 0x75 , 0x62 , 0x2e , 0x63 , 0x6f , 0x6d , 0x2f , 0x67 , 0x6f , 0x2d , 0x73 ,
0x6b , 0x79 , 0x6e , 0x65 , 0x74 , 0x2f , 0x4c , 0x6f , 0x63 , 0x61 , 0x6c , 0x41 , 0x49 , 0x2f , 0x70 , 0x6b ,
0x67 , 0x2f , 0x67 , 0x72 , 0x70 , 0x63 , 0x2f , 0x70 , 0x72 , 0x6f , 0x74 , 0x6f , 0x62 , 0x06 , 0x70 , 0x72 ,
0x6f , 0x74 , 0x6f , 0x33 ,
0x74 , 0x12 , 0x18 , 0x0a , 0x07 , 0x54 , 0x68 , 0x72 , 0x65 , 0x61 , 0x64 , 0x73 , 0x18 , 0x0f , 0x20 , 0x01 ,
0x28 , 0x05 , 0x52 , 0x07 , 0x54 , 0x68 , 0x72 , 0x65 , 0x61 , 0x64 , 0x73 , 0x12 , 0x2c , 0x0a , 0x11 , 0x4c ,
0x69 , 0x62 , 0x72 , 0x61 , 0x72 , 0x79 , 0x53 , 0x65 , 0x61 , 0x72 , 0x63 , 0x68 , 0x50 , 0x61 , 0x74 , 0x68 ,
0x18 , 0x10 , 0x20 , 0x01 , 0x28 , 0x09 , 0x52 , 0x11 , 0x4c , 0x69 , 0x62 , 0x72 , 0x61 , 0x72 , 0x79 , 0x53 ,
0x65 , 0x61 , 0x72 , 0x63 , 0x68 , 0x50 , 0x61 , 0x74 , 0x68 , 0x22 , 0x3c , 0x0a , 0x06 , 0x52 , 0x65 , 0x73 ,
0x75 , 0x6c , 0x74 , 0x12 , 0x18 , 0x0a , 0x07 , 0x6d , 0x65 , 0x73 , 0x73 , 0x61 , 0x67 , 0x65 , 0x18 , 0x01 ,
0x20 , 0x01 , 0x28 , 0x09 , 0x52 , 0x07 , 0x6d , 0x65 , 0x73 , 0x73 , 0x61 , 0x67 , 0x65 , 0x12 , 0x18 , 0x0a ,
0x07 , 0x73 , 0x75 , 0x63 , 0x63 , 0x65 , 0x73 , 0x73 , 0x18 , 0x02 , 0x20 , 0x01 , 0x28 , 0x08 , 0x52 , 0x07 ,
0x73 , 0x75 , 0x63 , 0x63 , 0x65 , 0x73 , 0x73 , 0x22 , 0x31 , 0x0a , 0x0f , 0x45 , 0x6d , 0x62 , 0x65 , 0x64 ,
0x64 , 0x69 , 0x6e , 0x67 , 0x52 , 0x65 , 0x73 , 0x75 , 0x6c , 0x74 , 0x12 , 0x1e , 0x0a , 0x0a , 0x65 , 0x6d ,
0x62 , 0x65 , 0x64 , 0x64 , 0x69 , 0x6e , 0x67 , 0x73 , 0x18 , 0x01 , 0x20 , 0x03 , 0x28 , 0x02 , 0x52 , 0x0a ,
0x65 , 0x6d , 0x62 , 0x65 , 0x64 , 0x64 , 0x69 , 0x6e , 0x67 , 0x73 , 0x32 , 0xfe , 0x01 , 0x0a , 0x03 , 0x4c ,
0x4c , 0x4d , 0x12 , 0x2a , 0x0a , 0x06 , 0x48 , 0x65 , 0x61 , 0x6c , 0x74 , 0x68 , 0x12 , 0x12 , 0x2e , 0x6c ,
0x6c , 0x6d , 0x2e , 0x48 , 0x65 , 0x61 , 0x6c , 0x74 , 0x68 , 0x4d , 0x65 , 0x73 , 0x73 , 0x61 , 0x67 , 0x65 ,
0x1a , 0x0a , 0x2e , 0x6c , 0x6c , 0x6d , 0x2e , 0x52 , 0x65 , 0x70 , 0x6c , 0x79 , 0x22 , 0x00 , 0x12 , 0x2c ,
0x0a , 0x07 , 0x50 , 0x72 , 0x65 , 0x64 , 0x69 , 0x63 , 0x74 , 0x12 , 0x13 , 0x2e , 0x6c , 0x6c , 0x6d , 0x2e ,
0x50 , 0x72 , 0x65 , 0x64 , 0x69 , 0x63 , 0x74 , 0x4f , 0x70 , 0x74 , 0x69 , 0x6f , 0x6e , 0x73 , 0x1a , 0x0a ,
0x2e , 0x6c , 0x6c , 0x6d , 0x2e , 0x52 , 0x65 , 0x70 , 0x6c , 0x79 , 0x22 , 0x00 , 0x12 , 0x2d , 0x0a , 0x09 ,
0x4c , 0x6f , 0x61 , 0x64 , 0x4d , 0x6f , 0x64 , 0x65 , 0x6c , 0x12 , 0x11 , 0x2e , 0x6c , 0x6c , 0x6d , 0x2e ,
0x4d , 0x6f , 0x64 , 0x65 , 0x6c , 0x4f , 0x70 , 0x74 , 0x69 , 0x6f , 0x6e , 0x73 , 0x1a , 0x0b , 0x2e , 0x6c ,
0x6c , 0x6d , 0x2e , 0x52 , 0x65 , 0x73 , 0x75 , 0x6c , 0x74 , 0x22 , 0x00 , 0x12 , 0x34 , 0x0a , 0x0d , 0x50 ,
0x72 , 0x65 , 0x64 , 0x69 , 0x63 , 0x74 , 0x53 , 0x74 , 0x72 , 0x65 , 0x61 , 0x6d , 0x12 , 0x13 , 0x2e , 0x6c ,
0x6c , 0x6d , 0x2e , 0x50 , 0x72 , 0x65 , 0x64 , 0x69 , 0x63 , 0x74 , 0x4f , 0x70 , 0x74 , 0x69 , 0x6f , 0x6e ,
0x73 , 0x1a , 0x0a , 0x2e , 0x6c , 0x6c , 0x6d , 0x2e , 0x52 , 0x65 , 0x70 , 0x6c , 0x79 , 0x22 , 0x00 , 0x30 ,
0x01 , 0x12 , 0x38 , 0x0a , 0x09 , 0x45 , 0x6d , 0x62 , 0x65 , 0x64 , 0x64 , 0x69 , 0x6e , 0x67 , 0x12 , 0x13 ,
0x2e , 0x6c , 0x6c , 0x6d , 0x2e , 0x50 , 0x72 , 0x65 , 0x64 , 0x69 , 0x63 , 0x74 , 0x4f , 0x70 , 0x74 , 0x69 ,
0x6f , 0x6e , 0x73 , 0x1a , 0x14 , 0x2e , 0x6c , 0x6c , 0x6d , 0x2e , 0x45 , 0x6d , 0x62 , 0x65 , 0x64 , 0x64 ,
0x69 , 0x6e , 0x67 , 0x52 , 0x65 , 0x73 , 0x75 , 0x6c , 0x74 , 0x22 , 0x00 , 0x42 , 0x57 , 0x0a , 0x1b , 0x69 ,
0x6f , 0x2e , 0x73 , 0x6b , 0x79 , 0x6e , 0x65 , 0x74 , 0x2e , 0x6c , 0x6f , 0x63 , 0x61 , 0x6c , 0x61 , 0x69 ,
0x2e , 0x6c , 0x6c , 0x6d , 0x73 , 0x65 , 0x72 , 0x76 , 0x65 , 0x72 , 0x42 , 0x09 , 0x4c , 0x4c , 0x4d , 0x53 ,
0x65 , 0x72 , 0x76 , 0x65 , 0x72 , 0x50 , 0x01 , 0x5a , 0x2b , 0x67 , 0x69 , 0x74 , 0x68 , 0x75 , 0x62 , 0x2e ,
0x63 , 0x6f , 0x6d , 0x2f , 0x67 , 0x6f , 0x2d , 0x73 , 0x6b , 0x79 , 0x6e , 0x65 , 0x74 , 0x2f , 0x4c , 0x6f ,
0x63 , 0x61 , 0x6c , 0x41 , 0x49 , 0x2f , 0x70 , 0x6b , 0x67 , 0x2f , 0x67 , 0x72 , 0x70 , 0x63 , 0x2f , 0x70 ,
0x72 , 0x6f , 0x74 , 0x6f , 0x62 , 0x06 , 0x70 , 0x72 , 0x6f , 0x74 , 0x6f , 0x33 ,
}
var (