ml

package

v0.0.0-...-0e1d3c2 Latest Latest Go to latest Published: May 16, 2023 License: MIT Imports: 9 Imported by: 0

Details

Valid go.mod file
Redistributable license
Tagged version
Stable version
Learn more about best practices

Repository

github.com/extrame/llama.go

Links

Open Source Insights

Documentation ¶

Rendered for

Index ¶

Constants
Variables
func AreSameShape(a, b *Tensor) bool
func BuildForwardExpand(graph *Graph, tensor *Tensor)
func BuildForwardImpl(graph *Graph, tensor *Tensor, expand bool)
func CanMulMat(t0, t1 *Tensor) bool
func CheckGraph()
func ComputeBackward(ctx *Context, tensor *Tensor, inplace bool)
func ComputeForward(ctx *Context, graph *Graph, params *ComputeParams, tensor *Tensor)
func ComputeForwardAddFP32(params *ComputeParams, src0, src1, dst *Tensor)
func ComputeForwardCopy(params *ComputeParams, src0, dst *Tensor)
func ComputeForwardDiagMaskInfFP32(params *ComputeParams, src0, src1, dst *Tensor)
func ComputeForwardDupFP32(params *ComputeParams, src0, dst *Tensor)
func ComputeForwardGetRows(params *ComputeParams, src0, src1, dst *Tensor)
func ComputeForwardMulFP32(params *ComputeParams, src0, src1, dst *Tensor)
func ComputeForwardMulMatFP32(params *ComputeParams, src0, src1, dst *Tensor)
func ComputeForwardPermute(params *ComputeParams, src0 *Tensor)
func ComputeForwardRMSNormFP32(params *ComputeParams, src0, dst *Tensor)
func ComputeForwardRepeatFP32(params *ComputeParams, src0, dst *Tensor)
func ComputeForwardReshape(params *ComputeParams, src0, dst *Tensor)
func ComputeForwardRopeFP32(params *ComputeParams, src0, src1, dst *Tensor)
func ComputeForwardScaleFP32(params *ComputeParams, src0, src1, dst *Tensor)
func ComputeForwardSiluFP32(params *ComputeParams, src0, dst *Tensor)
func ComputeForwardSoftMaxFP32(params *ComputeParams, src0, dst *Tensor)
func ComputeForwardView(params *ComputeParams, src0 *Tensor)
func Do(params *ComputeParams, id int)
func GraphCompute(ctx *Context, graph *Graph)
func Init(params InitParams)
func IsMatrix(tensor *Tensor) bool
func IsScalar(tensor *Tensor) bool
func IsVector(tensor *Tensor) bool
func Job(listen <-chan *ComputeParams, id int)
func SiluFP32(x float32) float32
func Token2Str(vocab *Vocab, token uint32) string
func Tokenize(vocab *Vocab, text string, bos bool) []uint32
func TryAddBigram(vocab *Vocab, symbols []Symbol, workQueue *[]Bigram, left, right int)
func TypeSizeFloat(dt DType) float32
func VecAccFP32(n uint32, y, x []float32)
func VecAddFP32(n uint32, z, x, y []float32)
func VecCopyFP32(n uint32, y, x []float32)
func VecDotFP32(n uint32, x, y []float32) float32
func VecMadFP32(n uint32, y, x []float32, v float32)
func VecMaxFP32(n uint32, x []float32) float32
func VecMulFP32(n uint32, z, x, y []float32)
func VecScaleFP32(n uint32, y []float32, v float32)
func VecSiluFP32(n uint32, y, x []float32)
func VisitParents(graph *Graph, node *Tensor)
type Allocator
- func NewAllocator() *Allocator
- func (a *Allocator) Get(size uint32) *[]float32
- func (a *Allocator) GetFixed(size uint32) *[]float32
- func (a *Allocator) Reset()
type Bigram
- func PopMax(queue *[]Bigram) Bigram
type ComputeParams
type Context
- func NewContext(maxThreads int, useAVX, useNEON bool) *Context
- func (ctx *Context) ReleaseContext()
type DType
type Graph
- func BuildBackward(ctx *Context, gf *Graph, keep bool) Graph
- func BuildForward(tensor *Tensor) *Graph
type InitParams
type Symbol
type TaskType
type Tensor
- func Add(ctx *Context, a, b *Tensor) *Tensor
- func AddImpl(ctx *Context, a, b *Tensor, inplace bool) *Tensor
- func AddInplace(ctx *Context, a, b *Tensor) *Tensor
- func Copy(ctx *Context, a, b *Tensor) *Tensor
- func CopyImpl(ctx *Context, a, b *Tensor, inplace bool) *Tensor
- func CopyInplace(ctx *Context, a, b *Tensor) *Tensor
- func DiagMaskInf(ctx *Context, a *Tensor, past uint32) *Tensor
- func Div(ctx *Context, a, b *Tensor) *Tensor
- func DivImpl(ctx *Context, a, b *Tensor, inplace bool) *Tensor
- func DivInplace(ctx *Context, a, b *Tensor, inplace bool) *Tensor
- func DupTensor(ctx *Context, src *Tensor) *Tensor
- func GetRows(ctx *Context, a, b *Tensor) *Tensor
- func Mul(ctx *Context, a, b *Tensor) *Tensor
- func MulImpl(ctx *Context, a, b *Tensor, inplace bool) *Tensor
- func MulInplace(ctx *Context, a, b *Tensor) *Tensor
- func MulMat(ctx *Context, a, b *Tensor) *Tensor
- func NewFP32(ctx *Context, value float32) *Tensor
- func NewTensor(ctx *Context, dt DType, dims uint32, ne0, ne1, ne2, ne3 uint32, data []float32) *Tensor
- func NewTensor1D(ctx *Context, dt DType, ne0 uint32) *Tensor
- func NewTensor2D(ctx *Context, dt DType, ne0, ne1 uint32) *Tensor
- func NewTensor3D(ctx *Context, dt DType, ne0, ne1, ne2 uint32) *Tensor
- func NewTensor4D(ctx *Context, dt DType, ne0, ne1, ne2, ne3 uint32) *Tensor
- func Permute(ctx *Context, a *Tensor, axis0, axis1, axis2, axis3 uint32) *Tensor
- func RMSNorm(ctx *Context, a *Tensor) *Tensor
- func RMSNormImpl(ctx *Context, a *Tensor, inplace bool) *Tensor
- func RMSNormInplace(ctx *Context, a *Tensor) *Tensor
- func Repeat(ctx *Context, a, b *Tensor) *Tensor
- func Reshape3D(ctx *Context, a *Tensor, ne0, ne1, ne2 uint32) *Tensor
- func Rope(ctx *Context, a *Tensor, past, dims, mode uint32) *Tensor
- func Scale(ctx *Context, a, b *Tensor) *Tensor
- func ScaleImpl(ctx *Context, a, b *Tensor, inplace bool) *Tensor
- func ScaleInplace(ctx *Context, a, b *Tensor) *Tensor
- func SetFP32(tensor *Tensor, value float32) *Tensor
- func Sgn(ctx *Context, a *Tensor) *Tensor
- func SgnImpl(ctx *Context, a *Tensor, inplace bool) *Tensor
- func SgnInplace(ctx *Context, a *Tensor) *Tensor
- func Silu(ctx *Context, a *Tensor) *Tensor
- func SiluImpl(ctx *Context, a *Tensor, inplace bool) *Tensor
- func SiluInplace(ctx *Context, a *Tensor) *Tensor
- func SoftMax(ctx *Context, a *Tensor) *Tensor
- func Step(ctx *Context, a *Tensor) *Tensor
- func StepImpl(ctx *Context, a *Tensor, inplace bool) *Tensor
- func StepInplace(ctx *Context, a *Tensor) *Tensor
- func Sub(ctx *Context, a, b *Tensor) *Tensor
- func SubImpl(ctx *Context, a, b *Tensor, inplace bool) *Tensor
- func SubInplace(ctx *Context, a, b *Tensor) *Tensor
- func Sum(ctx *Context, a *Tensor) *Tensor
- func Transpose(ctx *Context, a *Tensor) *Tensor
- func View1D(ctx *Context, a *Tensor, ne0 uint32, offset uint32) *Tensor
- func ViewTensor(ctx *Context, src *Tensor) *Tensor
- func (tensor *Tensor) IsContiguous() bool
- func (t *Tensor) Nbytes() uint32
- func (t *Tensor) Nelements() uint32
- func (t *Tensor) Nrows() uint32
type TokenScore
type Vocab
- func NewVocab(size uint32) *Vocab

Constants ¶

View Source

const (
	DEBUG = false

	MAX_DIMS   = 4
	MAX_NODES  = 4096
	MAX_PARAMS = 16
	MAX_OPT    = 4

	QK = 32 // quantization

	TOKEN_BOS = 1
	TOKEN_EOS = 2
)

View Source

const (
	OP_NONE optype = iota
	OP_DUP
	OP_ADD
	OP_SUB
	OP_MUL
	OP_DIV
	OP_SQR
	OP_SQRT
	OP_SUM
	OP_MEAN
	OP_REPEAT
	OP_ABS
	OP_SGN
	OP_NEG
	OP_STEP
	OP_RELU
	OP_GELU
	OP_SILU
	OP_NORM
	OP_RMS_NORM

	OP_MUL_MAT

	OP_SCALE
	OP_CPY
	OP_RESHAPE
	OP_VIEW
	OP_PERMUTE
	OP_TRANSPOSE
	OP_GET_ROWS
	OP_DIAG_MASK_INF
	OP_SOFT_MAX
	OP_ROPE
	OP_CONV_1D_1S
	OP_CONV_1D_2S

	OP_FLASH_ATTN
	OP_FLASH_FF

	OP_COUNT
)

View Source

const MaxMem = 0 // 28_000_000_000

View Source

const MaxPool = 0 // 2_000_000_000

TODO: Precompute max needed RAM size

View Source

const NewLineToken = 13 // ml.Tokenize(Ctx.Vocab, "\n", false)[0]

Variables ¶

View Source

var BLCK_SIZE [TYPE_COUNT]uint32 = [TYPE_COUNT]uint32{1, 1, QK, QK, 1, 1, 1, 0}

View Source

var TYPE_SIZE [TYPE_COUNT]uint32 = [TYPE_COUNT]uint32{4, 2, 4 + QK/2, 4*2 + QK/2, 1, 2, 4, 0}

View Source

var TableExpFP16 [1 << 16]float16.Float16

TableExpFP16 is a precomputed exp table for FP16 values (128 KB). C original: `static ggml_fp16_t table_exp_f16[1 << 16];`

Functions ¶

func AreSameShape ¶

func AreSameShape(a, b *Tensor) bool

func CheckGraph ¶

func CheckGraph()

TODO: Implement all the tensor asserts BEFORE the real computing

func ComputeBackward ¶

func ComputeBackward(ctx *Context, tensor *Tensor, inplace bool)

func ComputeForward ¶

func ComputeForward(ctx *Context, graph *Graph, params *ComputeParams, tensor *Tensor)

func ComputeForwardCopy ¶

func ComputeForwardCopy(params *ComputeParams, src0, dst *Tensor)

func ComputeForwardDiagMaskInfFP32 ¶

func ComputeForwardDiagMaskInfFP32(params *ComputeParams, src0, src1, dst *Tensor)

ggml_compute_forward_diag_mask_inf

func ComputeForwardMulMatFP32 ¶

func ComputeForwardMulMatFP32(params *ComputeParams, src0, src1, dst *Tensor)

ggml_compute_forward_mul_mat_f32

func ComputeForwardRMSNormFP32 ¶

func ComputeForwardRMSNormFP32(params *ComputeParams, src0, dst *Tensor)

ggml_compute_forward_rms_norm_f32

func ComputeForwardRepeatFP32 ¶

func ComputeForwardRepeatFP32(params *ComputeParams, src0, dst *Tensor)

ggml_compute_forward_repeat

func ComputeForwardScaleFP32 ¶

func ComputeForwardScaleFP32(params *ComputeParams, src0, src1, dst *Tensor)

ggml_compute_forward_scale_f32

func ComputeForwardSoftMaxFP32 ¶

func ComputeForwardSoftMaxFP32(params *ComputeParams, src0, dst *Tensor)

ggml_compute_forward_soft_max

func Do ¶

func Do(params *ComputeParams, id int)

Do is an experimental alternative to the always-waiting Job goroutines.

func GraphCompute ¶

func GraphCompute(ctx *Context, graph *Graph)

func IsMatrix ¶

func IsMatrix(tensor *Tensor) bool

func IsScalar ¶

func IsScalar(tensor *Tensor) bool

func IsVector ¶

func IsVector(tensor *Tensor) bool

func Job ¶

func Job(listen <-chan *ComputeParams, id int)

Job is a goroutine that exists while the computation loop is active. The main purpose of a Job is to perform part of the time-consuming matrix multiplications. TODO: Investigate https://pkg.go.dev/runtime#LockOSThread

func SiluFP32 ¶

func SiluFP32(x float32) float32

Sigmoid Linear Unit (SiLU) function

func Token2Str ¶

func Token2Str(vocab *Vocab, token uint32) string

func Tokenize ¶

func Tokenize(vocab *Vocab, text string, bos bool) []uint32

C++ original: `void tokenize(const std::string & text, std::vector<llama_vocab::id> & output)`

func TryAddBigram ¶

func TryAddBigram(vocab *Vocab, symbols []Symbol, workQueue *[]Bigram, left, right int)

func TypeSizeFloat ¶

func TypeSizeFloat(dt DType) float32

func VecAccFP32 ¶

func VecAccFP32(n uint32, y, x []float32)

ggml_vec_acc_f32

func VecAddFP32 ¶

func VecAddFP32(n uint32, z, x, y []float32)

inline static void ggml_vec_add_f32 (const int n, float * z, const float * x, const float * y) { for (int i = 0; i < n; ++i) z[i] = x[i] + y[i]; }

func VecCopyFP32 ¶

func VecCopyFP32(n uint32, y, x []float32)

func VecDotFP32 ¶

func VecDotFP32(n uint32, x, y []float32) float32

ggml_vec_dot_f32

func VecMadFP32 ¶

func VecMadFP32(n uint32, y, x []float32, v float32)

ggml_vec_mad_f32

func VecMaxFP32 ¶

func VecMaxFP32(n uint32, x []float32) float32

func VecMulFP32 ¶

func VecMulFP32(n uint32, z, x, y []float32)

func VecScaleFP32 ¶

func VecScaleFP32(n uint32, y []float32, v float32)

ggml_vec_scale_f32

func VecSiluFP32 ¶

func VecSiluFP32(n uint32, y, x []float32)

C original: `inline static void ggml_vec_silu_f32(const int n, float * y, const float * x)`

func VisitParents ¶

func VisitParents(graph *Graph, node *Tensor)

ggml_visit_parents

Types ¶

type Allocator ¶

type Allocator struct {
	sync.Mutex

	PoolSize int
	MemSize  int

	Pool []byte
	Mem  []byte
}

Allocator is an experimental memory pool for FP32 slices. TODO: Investigate https://github.com/valyala/bytebufferpool

func NewAllocator ¶

func NewAllocator() *Allocator

func (*Allocator) Get ¶

func (a *Allocator) Get(size uint32) *[]float32

Get returns a new or reused memory buffer of `size` bytes.

func (*Allocator) GetFixed ¶

func (a *Allocator) GetFixed(size uint32) *[]float32

GetFixed returns a fixed memory buffer of `size` bytes.

func (*Allocator) Reset ¶

func (a *Allocator) Reset()

type Bigram ¶

type Bigram struct {

	// NB! Allow -1
	Left  int
	Right int

	Score float32
	Size  uint32
}

C++ original: `struct llama_sp_bigram`

func PopMax ¶

func PopMax(queue *[]Bigram) Bigram

type ComputeParams ¶

type ComputeParams struct {
	Type TaskType

	UseAVX  bool
	UseNEON bool
	// contains filtered or unexported fields
}

type Context ¶

type Context struct {
	MaxThreads int
	UseAVX     bool
	UseNEON    bool
	//Graph      *Graph
	Compute   chan *ComputeParams
	Allocator *Allocator
}

func NewContext ¶

func NewContext(maxThreads int, useAVX, useNEON bool) *Context

func (*Context) ReleaseContext ¶

func (ctx *Context) ReleaseContext()

ReleaseContext frees all context resources: the channel is closed and the goroutines are stopped.

type DType ¶

type DType uint8

const (
	TYPE_F32   DType = 0
	TYPE_F16   DType = 1
	TYPE_Q4_0  DType = 2
	TYPE_Q4_1  DType = 3
	TYPE_I8    DType = 4
	TYPE_I16   DType = 5
	TYPE_I32   DType = 6
	TYPE_COUNT DType = 8
)

The data types are the same as in llama.cpp, so they are fully compatible with it.

type Graph ¶

type Graph struct {
	NodesCount uint32
	LeafsCount uint32

	Jobs chan *ComputeParams

	Nodes [MAX_NODES]*Tensor
	Grads [MAX_NODES]*Tensor
	Leafs [MAX_NODES]*Tensor
}

computation graph

func BuildBackward ¶

func BuildBackward(ctx *Context, gf *Graph, keep bool) Graph

func BuildForward ¶

func BuildForward(tensor *Tensor) *Graph

type InitParams ¶

type InitParams struct {
}

type Symbol ¶

type Symbol struct {

	// NB! Allow -1
	Prev int
	Next int

	Text string
	N    uint32
}

C++ original: `struct llama_sp_symbol`

type TaskType ¶

type TaskType uint8

const (
	TASK_INIT     TaskType = 0
	TASK_COMPUTE  TaskType = 1
	TASK_FINALIZE TaskType = 2
)

type Tensor ¶

type Tensor struct {
	Type DType

	Reusable bool // this tensor Data buffer might be reused with pooling

	Dims uint32

	NE [MAX_DIMS]uint32 // number of elements
	NB [MAX_DIMS]uint32 // stride in bytes

	TasksCount int

	Data []float32
	// contains filtered or unexported fields
}

func Add ¶

func Add(ctx *Context, a, b *Tensor) *Tensor

func AddImpl ¶

func AddImpl(ctx *Context, a, b *Tensor, inplace bool) *Tensor

ggml_add

func AddInplace ¶

func AddInplace(ctx *Context, a, b *Tensor) *Tensor

func Copy ¶

func Copy(ctx *Context, a, b *Tensor) *Tensor

func CopyImpl ¶

func CopyImpl(ctx *Context, a, b *Tensor, inplace bool) *Tensor

ggml_cpy

func CopyInplace ¶

func CopyInplace(ctx *Context, a, b *Tensor) *Tensor

func DiagMaskInf ¶

func DiagMaskInf(ctx *Context, a *Tensor, past uint32) *Tensor

ggml_diag_mask_inf

func Div ¶

func Div(ctx *Context, a, b *Tensor) *Tensor

func DivImpl ¶

func DivImpl(ctx *Context, a, b *Tensor, inplace bool) *Tensor

ggml_div

func DivInplace ¶

func DivInplace(ctx *Context, a, b *Tensor, inplace bool) *Tensor

func DupTensor ¶

func DupTensor(ctx *Context, src *Tensor) *Tensor

ggml_dup_tensor

func GetRows ¶

func GetRows(ctx *Context, a, b *Tensor) *Tensor

ggml_get_rows

func Mul ¶

func Mul(ctx *Context, a, b *Tensor) *Tensor

C original: `struct ggml_tensor * Mul(...)`

func MulImpl ¶

func MulImpl(ctx *Context, a, b *Tensor, inplace bool) *Tensor

C original: `struct ggml_tensor * Mul_impl(...)`

func MulInplace ¶

func MulInplace(ctx *Context, a, b *Tensor) *Tensor

C original: `struct ggml_tensor * Mul_inplace(...)`

func MulMat ¶

func MulMat(ctx *Context, a, b *Tensor) *Tensor

ggml_mul_mat

func NewFP32 ¶

func NewFP32(ctx *Context, value float32) *Tensor

ggml_new_f32

func NewTensor ¶

func NewTensor(ctx *Context, dt DType, dims uint32, ne0, ne1, ne2, ne3 uint32, data []float32) *Tensor

ggml_new_tensor_impl

func NewTensor1D ¶

func NewTensor1D(ctx *Context, dt DType, ne0 uint32) *Tensor

ggml_new_tensor_1d

func NewTensor2D ¶

func NewTensor2D(ctx *Context, dt DType, ne0, ne1 uint32) *Tensor

ggml_new_tensor_2d

func NewTensor3D ¶

func NewTensor3D(ctx *Context, dt DType, ne0, ne1, ne2 uint32) *Tensor

func NewTensor4D ¶

func NewTensor4D(ctx *Context, dt DType, ne0, ne1, ne2, ne3 uint32) *Tensor

func Permute ¶

func Permute(ctx *Context, a *Tensor, axis0, axis1, axis2, axis3 uint32) *Tensor

ggml_permute

func RMSNorm ¶

func RMSNorm(ctx *Context, a *Tensor) *Tensor

func RMSNormImpl ¶

func RMSNormImpl(ctx *Context, a *Tensor, inplace bool) *Tensor

ggml_rms_norm_impl

func RMSNormInplace ¶

func RMSNormInplace(ctx *Context, a *Tensor) *Tensor

func Repeat ¶

func Repeat(ctx *Context, a, b *Tensor) *Tensor

C original: `struct ggml_tensor * Repeat(...)`

func Reshape3D ¶

func Reshape3D(ctx *Context, a *Tensor, ne0, ne1, ne2 uint32) *Tensor

func Rope ¶

func Rope(ctx *Context, a *Tensor, past, dims, mode uint32) *Tensor

ggml_rope

func Scale ¶

func Scale(ctx *Context, a, b *Tensor) *Tensor

func ScaleImpl ¶

func ScaleImpl(ctx *Context, a, b *Tensor, inplace bool) *Tensor

ggml_scale

func ScaleInplace ¶

func ScaleInplace(ctx *Context, a, b *Tensor) *Tensor

func SetFP32 ¶

func SetFP32(tensor *Tensor, value float32) *Tensor

ggml_set_f32

func Sgn ¶

func Sgn(ctx *Context, a *Tensor) *Tensor

func SgnImpl ¶

func SgnImpl(ctx *Context, a *Tensor, inplace bool) *Tensor

ggml_sgn

func SgnInplace ¶

func SgnInplace(ctx *Context, a *Tensor) *Tensor

func Silu ¶

func Silu(ctx *Context, a *Tensor) *Tensor

func SiluImpl ¶

func SiluImpl(ctx *Context, a *Tensor, inplace bool) *Tensor

func SiluInplace ¶

func SiluInplace(ctx *Context, a *Tensor) *Tensor

func SoftMax ¶

func SoftMax(ctx *Context, a *Tensor) *Tensor

ggml_soft_max

func Step ¶

func Step(ctx *Context, a *Tensor) *Tensor

func StepImpl ¶

func StepImpl(ctx *Context, a *Tensor, inplace bool) *Tensor

ggml_step

func StepInplace ¶

func StepInplace(ctx *Context, a *Tensor) *Tensor

func Sub ¶

func Sub(ctx *Context, a, b *Tensor) *Tensor

func SubImpl ¶

func SubImpl(ctx *Context, a, b *Tensor, inplace bool) *Tensor

ggml_sub

func SubInplace ¶

func SubInplace(ctx *Context, a, b *Tensor) *Tensor

func Sum ¶

func Sum(ctx *Context, a *Tensor) *Tensor

ggml_sum

func Transpose ¶

func Transpose(ctx *Context, a *Tensor) *Tensor

func View1D ¶

func View1D(ctx *Context, a *Tensor, ne0 uint32, offset uint32) *Tensor

ggml_view_1d. NB! In the original, the offset is given in bytes; here it is given in floats (4 bytes each).

func ViewTensor ¶

func ViewTensor(ctx *Context, src *Tensor) *Tensor

ggml_view_tensor

func (*Tensor) IsContiguous ¶

func (tensor *Tensor) IsContiguous() bool

ggml_is_contiguous

func (*Tensor) Nbytes ¶

func (t *Tensor) Nbytes() uint32

ggml_nbytes

func (*Tensor) Nelements ¶

func (t *Tensor) Nelements() uint32

func (*Tensor) Nrows ¶

func (t *Tensor) Nrows() uint32

type TokenScore ¶

type TokenScore struct {
	Token string
	Score float32
}

type Vocab ¶

type Vocab struct {
	Size     uint32
	Token2ID map[string]uint32
	ID2Token []TokenScore
}

func NewVocab ¶

func NewVocab(size uint32) *Vocab

Source Files ¶

View all Source files

?	: This menu
/	: Search site
f or F	: Jump to
y or Y	: Canonical URL

Documentation ¶

Index ¶

Constants ¶

Variables ¶

Functions ¶

func AreSameShape ¶

func BuildForwardExpand ¶

func BuildForwardImpl ¶

func CanMulMat ¶

func CheckGraph ¶

func ComputeBackward ¶

func ComputeForward ¶

func ComputeForwardAddFP32 ¶

func ComputeForwardCopy ¶

func ComputeForwardDiagMaskInfFP32 ¶

func ComputeForwardDupFP32 ¶

func ComputeForwardGetRows ¶

func ComputeForwardMulFP32 ¶

func ComputeForwardMulMatFP32 ¶

func ComputeForwardPermute ¶

func ComputeForwardRMSNormFP32 ¶

func ComputeForwardRepeatFP32 ¶

func ComputeForwardReshape ¶

func ComputeForwardRopeFP32 ¶

func ComputeForwardScaleFP32 ¶

func ComputeForwardSiluFP32 ¶

func ComputeForwardSoftMaxFP32 ¶

func ComputeForwardView ¶

func Do ¶

func GraphCompute ¶

func Init ¶

func IsMatrix ¶

func IsScalar ¶

func IsVector ¶

func Job ¶

func SiluFP32 ¶

func Token2Str ¶

func Tokenize ¶

func TryAddBigram ¶

func TypeSizeFloat ¶

func VecAccFP32 ¶

func VecAddFP32 ¶

func VecCopyFP32 ¶

func VecDotFP32 ¶

func VecMadFP32 ¶

func VecMaxFP32 ¶

func VecMulFP32 ¶

func VecScaleFP32 ¶

func VecSiluFP32 ¶

func VisitParents ¶

Types ¶

type Allocator ¶

func NewAllocator ¶

func (*Allocator) Get ¶

func (*Allocator) GetFixed ¶

func (*Allocator) Reset ¶

type Bigram ¶

func PopMax ¶

type ComputeParams ¶

type Context ¶

func NewContext ¶

func (*Context) ReleaseContext ¶

type DType ¶

type Graph ¶

func BuildBackward ¶

func BuildForward ¶

type InitParams ¶

type Symbol ¶

type TaskType ¶

type Tensor ¶

func Add ¶

func AddImpl ¶

func AddInplace ¶

func Copy ¶

func CopyImpl ¶

func CopyInplace ¶

func DiagMaskInf ¶

func Div ¶

func DivImpl ¶

func DivInplace ¶