🤖 Self-hosted, community-driven, local OpenAI-compatible API, with a Keycloak-authenticated Flask app as the frontend. 🏠
FlaskAI/main.go
package main

import (
    "bytes"
    "fmt"
    "io"
    "os"
    "runtime"
    "text/template"

    llama "github.com/go-skynet/go-llama.cpp"
    "github.com/urfave/cli/v2"
)
// Prompt templates in the Alpaca instruction format: one for instruction-only
// requests, one for requests that also carry an input.
var emptyInput string = `Below is an instruction that describes a task. Write a response that appropriately completes the request.
### Instruction:
{{.Instruction}}
### Response:`
var nonEmptyInput string = `Below is an instruction that describes a task, paired with an input that provides further context. Write a response that appropriately completes the request.
### Instruction:
{{.Instruction}}
### Input:
{{.Input}}
### Response:
`
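// Rendering nonEmptyInput with, for example, Instruction "Summarize the text"
// and Input "Alpacas are camelids." substitutes those values for
// {{.Instruction}} and {{.Input}}, yielding a complete Alpaca-style prompt.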
// llamaFromOptions loads the model file named by --model, with the context
// window set from --context-size.
func llamaFromOptions(ctx *cli.Context) (*llama.LLama, error) {
    opts := []llama.ModelOption{llama.SetContext(ctx.Int("context-size"))}
    return llama.New(ctx.String("model"), opts...)
}
// templateString renders the text/template t with the data in in.
func templateString(t string, in interface{}) (string, error) {
    // Parse the template
    tmpl, err := template.New("prompt").Parse(t)
    if err != nil {
        return "", err
    }

    var buf bytes.Buffer
    if err := tmpl.Execute(&buf, in); err != nil {
        return "", err
    }
    return buf.String(), nil
}
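// Example (hypothetical values):
//
//	prompt, err := templateString(emptyInput,
//		struct{ Instruction string }{Instruction: "What is an alpaca?"})
//
// fills {{.Instruction}} in the instruction-only template; the result is the
// string later handed to Predict.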
var modelFlags = []cli.Flag{
    &cli.StringFlag{
        Name:    "model",
        EnvVars: []string{"MODEL_PATH"},
    },
    &cli.IntFlag{
        Name:    "tokens",
        EnvVars: []string{"TOKENS"},
        Value:   128,
    },
    &cli.IntFlag{
        Name:    "context-size",
        EnvVars: []string{"CONTEXT_SIZE"},
        Value:   512,
    },
    &cli.IntFlag{
        Name:    "threads",
        EnvVars: []string{"THREADS"},
        Value:   runtime.NumCPU(),
    },
    &cli.Float64Flag{
        Name:    "temperature",
        EnvVars: []string{"TEMPERATURE"},
        Value:   0.95,
    },
    &cli.Float64Flag{
        Name:    "topp",
        EnvVars: []string{"TOP_P"},
        Value:   0.85,
    },
    &cli.IntFlag{
        Name:    "topk",
        EnvVars: []string{"TOP_K"},
        Value:   20,
    },
}
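// Each flag can also be supplied through its environment variable, e.g.
// MODEL_PATH=~/ggml-alpaca-7b-q4.bin TOKENS=256 llama-cli --instruction "...".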
func main() {
    app := &cli.App{
        Name:    "llama-cli",
        Version: "0.1",
        Usage:   "llama-cli --model ... --instruction 'What is an alpaca?'",
        Flags: append(modelFlags,
            &cli.StringFlag{
                Name:    "template",
                EnvVars: []string{"TEMPLATE"},
            },
            &cli.StringFlag{
                Name:    "instruction",
                EnvVars: []string{"INSTRUCTION"},
            },
            &cli.StringFlag{
                Name:    "input",
                EnvVars: []string{"INPUT"},
            }),
        Description: `Run llama.cpp inference`,
        UsageText: `
llama-cli --model ~/ggml-alpaca-7b-q4.bin --instruction "What's an alpaca?"

An Alpaca (Vicugna pacos) is a domesticated species of South American camelid, related to llamas and originally from Peru but now found throughout much of Andean region. They are bred for their fleeces which can be spun into wool or knitted items such as hats, sweaters, blankets etc

echo "An Alpaca (Vicugna pacos) is a domesticated species of South American camelid, related to llamas and originally from Peru but now found throughout much of Andean region. They are bred for their fleeces which can be spun into wool or knitted items such as hats, sweaters, blankets etc" | llama-cli --model ~/ggml-alpaca-7b-q4.bin --instruction "Proofread, improving clarity and flow" --input "-"

An Alpaca (Vicugna pacos) is a domesticated species from South America that's related to llamas. Originating in Peru but now found throughout the Andean region, they are bred for their fleeces which can be spun into wool or knitted items such as hats and sweaters, blankets too!
`,
        Copyright: "go-skynet authors",
        Commands: []*cli.Command{
            {
                Flags: modelFlags,
                Name:  "interactive",
                Action: func(ctx *cli.Context) error {
                    l, err := llamaFromOptions(ctx)
                    if err != nil {
                        fmt.Println("Loading the model failed:", err.Error())
                        os.Exit(1)
                    }
                    // startInteractive (defined elsewhere in this package)
                    // runs a REPL against the loaded model with these
                    // sampling options.
                    return startInteractive(l,
                        llama.SetTemperature(ctx.Float64("temperature")),
                        llama.SetTopP(ctx.Float64("topp")),
                        llama.SetTopK(ctx.Int("topk")),
                        llama.SetTokens(ctx.Int("tokens")),
                        llama.SetThreads(ctx.Int("threads")))
                },
            },
            {
                Name: "api",
                Flags: []cli.Flag{
                    &cli.IntFlag{
                        Name:    "threads",
                        EnvVars: []string{"THREADS"},
                        Value:   runtime.NumCPU(),
                    },
                    &cli.StringFlag{
                        Name:    "model",
                        EnvVars: []string{"MODEL_PATH"},
                    },
                    &cli.StringFlag{
                        Name:    "address",
                        EnvVars: []string{"ADDRESS"},
                        Value:   ":8080",
                    },
                    &cli.IntFlag{
                        Name:    "context-size",
                        EnvVars: []string{"CONTEXT_SIZE"},
                        Value:   512,
                    },
                },
                Action: func(ctx *cli.Context) error {
                    l, err := llamaFromOptions(ctx)
                    if err != nil {
                        fmt.Println("Loading the model failed:", err.Error())
                        os.Exit(1)
                    }
                    // api (defined elsewhere in this package) serves the
                    // loaded model over HTTP on the given address.
                    return api(l, ctx.String("address"), ctx.Int("threads"))
                },
            },
        },
        Action: func(ctx *cli.Context) error {
            instruction := ctx.String("instruction")
            input := ctx.String("input")
            templ := ctx.String("template")

            // Pick the built-in prompt template based on whether an input
            // was given; a --template file, if set, overrides both.
            promptTemplate := emptyInput
            if input != "" {
                promptTemplate = nonEmptyInput
            }
            if templ != "" {
                dat, err := os.ReadFile(templ)
                if err != nil {
                    fmt.Printf("Failed reading file: %s", err.Error())
                    os.Exit(1)
                }
                promptTemplate = string(dat)
            }

            // "-" means: read the value from standard input.
            if instruction == "-" {
                dat, err := io.ReadAll(os.Stdin)
                if err != nil {
                    fmt.Printf("reading stdin failed: %s", err)
                    os.Exit(1)
                }
                instruction = string(dat)
            }
            if input == "-" {
                dat, err := io.ReadAll(os.Stdin)
                if err != nil {
                    fmt.Printf("reading stdin failed: %s", err)
                    os.Exit(1)
                }
                input = string(dat)
            }
            // Render the prompt, load the model, and run a single prediction.
            str, err := templateString(promptTemplate, struct {
                Instruction string
                Input       string
            }{Instruction: instruction, Input: input})
            if err != nil {
                fmt.Println("Templating the input failed:", err.Error())
                os.Exit(1)
            }

            l, err := llamaFromOptions(ctx)
            if err != nil {
                fmt.Println("Loading the model failed:", err.Error())
                os.Exit(1)
            }

            res, err := l.Predict(
                str,
                llama.SetTemperature(ctx.Float64("temperature")),
                llama.SetTopP(ctx.Float64("topp")),
                llama.SetTopK(ctx.Int("topk")),
                llama.SetTokens(ctx.Int("tokens")),
                llama.SetThreads(ctx.Int("threads")),
            )
            if err != nil {
                fmt.Printf("predicting failed: %s", err)
                os.Exit(1)
            }
            fmt.Println(res)
            return nil
        },
    }

    if err := app.Run(os.Args); err != nil {
        fmt.Println(err)
        os.Exit(1)
    }
}
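The same load-and-predict flow that backs the root command can also be driven from Go directly. Below is a minimal sketch that assumes only the go-llama.cpp calls already used in main.go (llama.New, llama.SetContext, Predict, and the sampling options); the model path and prompt are placeholders:

package main

import (
    "fmt"
    "runtime"

    llama "github.com/go-skynet/go-llama.cpp"
)

func main() {
    // Load a ggml model with the CLI's default 512-token context window.
    l, err := llama.New("./ggml-alpaca-7b-q4.bin", llama.SetContext(512))
    if err != nil {
        panic(err)
    }

    // One-shot prediction using the same sampling defaults as the CLI flags:
    // temperature 0.95, top-p 0.85, top-k 20, 128 tokens, all CPU threads.
    res, err := l.Predict(
        "Below is an instruction that describes a task. Write a response that appropriately completes the request.\n### Instruction:\nWhat is an alpaca?\n### Response:",
        llama.SetTemperature(0.95),
        llama.SetTopP(0.85),
        llama.SetTopK(20),
        llama.SetTokens(128),
        llama.SetThreads(runtime.NumCPU()),
    )
    if err != nil {
        panic(err)
    }
    fmt.Println(res)
}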