llama2

package

v0.9.8 Latest Latest Go to latest Published: Nov 27, 2024 License: Apache-2.0 Imports: 2 Imported by: 0

Details

Valid go.mod file
Redistributable license
Tagged version
Stable version
Learn more about best practices

Repository

github.com/goplus/llgo

Links

Open Source Insights

README ¶

LLGo wrapper of karpathy/llama2.c

How to update source to llgo

git submodule init
git submodule update
cp llama2.c/run.c llama2/run.c

Documentation ¶

Index ¶

Constants
func BuildSampler(sampler *Sampler, vocabSize c.Int, temperature c.Float, topp c.Float, ...)
func BuildTokenizer(t *Tokenizer, tokenizerPath *c.Char, vocabSize c.Int)
func BuildTransformer(t *Transformer, checkpointPath *c.Char)
func Chat(transformer *Transformer, tokenizer *Tokenizer, sampler *Sampler, ...)
func FreeSampler(sampler *Sampler)
func FreeTokenizer(t *Tokenizer)
func FreeTransformer(t *Transformer)
func Generate(transformer *Transformer, tokenizer *Tokenizer, sampler *Sampler, ...)
type Config
type ProbIndex
type RunState
type Sampler
type TokenIndex
type Tokenizer
type Transformer
type TransformerWeights

Constants ¶

View Source

const (
	LLGoFiles   = "llama2/llama2.c"
	LLGoPackage = "link: -lm"
)

Variables ¶

This section is empty.

Functions ¶

func BuildSampler ¶

func BuildSampler(sampler *Sampler, vocabSize c.Int, temperature c.Float, topp c.Float, rngSeed uint64)

func BuildTokenizer ¶

func BuildTokenizer(t *Tokenizer, tokenizerPath *c.Char, vocabSize c.Int)

func BuildTransformer ¶

func BuildTransformer(t *Transformer, checkpointPath *c.Char)

func Chat ¶

func Chat(
	transformer *Transformer, tokenizer *Tokenizer, sampler *Sampler,
	cliUserPrompt *c.Char, cliSystemPrompt *c.Char, steps c.Int)

func FreeSampler ¶

func FreeSampler(sampler *Sampler)

func FreeTokenizer ¶

func FreeTokenizer(t *Tokenizer)

func FreeTransformer ¶

func FreeTransformer(t *Transformer)

func Generate ¶

func Generate(
	transformer *Transformer, tokenizer *Tokenizer, sampler *Sampler,
	prompt *c.Char, steps c.Int)

Types ¶

type Config ¶

type Config struct {
	Dim       c.Int // transformer dimension
	HiddenDim c.Int // for ffn layers
	NLayers   c.Int // number of layers
	NHeads    c.Int // number of query heads
	NKVHeads  c.Int // number of key/value heads (can be < query heads because of multiquery)
	VocabSize c.Int // vocabulary size, usually 256 (byte-level)
	SeqLen    c.Int // max sequence length
}

llgo:type C

type ProbIndex ¶

type ProbIndex struct {
	Prob  c.Float
	Index c.Int

} // struct used when sorting probabilities during top-p sampling

llgo:type C

type RunState ¶

type RunState struct {
	// current wave of activations
	X      *c.Float // activation at current time stamp (dim,)
	Xb     *c.Float // same, but inside a residual branch (dim,)
	Xb2    *c.Float // an additional buffer just for convenience (dim,)
	Hb     *c.Float // buffer for hidden dimension in the ffn (hidden_dim,)
	Hb2    *c.Float // buffer for hidden dimension in the ffn (hidden_dim,)
	Q      *c.Float // query (dim,)
	K      *c.Float // key (dim,)
	V      *c.Float // value (dim,)
	Att    *c.Float // buffer for scores/attention values (n_heads, seq_len)
	Logits *c.Float // output logits
	// kv cache
	KeyCache   *c.Float // (layer, seq_len, dim)
	ValueCache *c.Float // (layer, seq_len, dim)
}

llgo:type C

type Sampler ¶

type Sampler struct {
	VocabSize   c.Int
	Probindex   *ProbIndex // buffer used in top-p sampling
	Temperature c.Float
	Topp        c.Float
	RngState    uint64
}

llgo:type C

type TokenIndex ¶

type TokenIndex struct {
	Str *c.Char
	Id  c.Int
}

llgo:type C

type Tokenizer ¶

type Tokenizer struct {
	Vocab          **c.Char
	VocabScores    *c.Float
	SortedVocab    *TokenIndex
	VocabSize      c.Int
	MaxTokenLength c.Uint
	BytePieces     [512]uint8 // stores all single-byte strings
}

llgo:type C

type Transformer ¶

type Transformer struct {
	Config  Config             // the hyperparameters of the architecture (the blueprint)
	Weights TransformerWeights // the weights of the model
	State   RunState           // buffers for the "wave" of activations in the forward pass

	// some more state needed to properly clean up the memory mapping (sigh)
	Fd       c.Int    // file descriptor for memory mapping
	Data     *c.Float // memory mapped data pointer
	FileSize uintptr  // size of the checkpoint file in bytes
}

llgo:type C

type TransformerWeights ¶

type TransformerWeights struct {
	// token embedding table
	TokenEmbeddingTable *c.Float // (vocab_size, dim)
	// weights for rmsnorms
	RmsAttWeight *c.Float // (layer, dim) rmsnorm weights
	RmsFfnWeight *c.Float // (layer, dim)
	// weights for matmuls. note dim == n_heads * head_size
	Wq *c.Float // (layer, dim, n_heads * head_size)
	Wk *c.Float // (layer, dim, n_kv_heads * head_size)
	Wv *c.Float // (layer, dim, n_kv_heads * head_size)
	Wo *c.Float // (layer, n_heads * head_size, dim)
	// weights for ffn
	W1 *c.Float // (layer, hidden_dim, dim)
	W2 *c.Float // (layer, dim, hidden_dim)
	W3 *c.Float // (layer, hidden_dim, dim)
	// final rmsnorm
	RmsFinalWeight *c.Float // (dim,)
	// (optional) classifier weights for the logits, on the last layer
	Wcls *c.Float
}

llgo:type C

Source Files ¶

View all Source files

llama2.go

?	: This menu
/	: Search site
f or F	: Jump to
y or Y	: Canonical URL