Expand description
Build Info
- GGML Commit: unknown
- GGML Commit Time: 1755364212
§ggml-ffi
Low-level Rust FFI bindings to the GGML C API shipped in this repository under ggml/.
There are no semantic versioning guarantees. Each version of this crate is tied to a specific GGML commit. This crate’s version should only be used to pin GGML revisions.
§Features
- metal: Enable GGML_METAL backend and link Metal frameworks on Apple.
- cuda: Enable GGML_CUDA backend and link CUDA runtime/BLAS libraries.
- vulkan: Enable GGML_VULKAN backend and link libvulkan.
- opencl: Enable GGML_OPENCL backend and link OpenCL (framework on Apple).
- hip: Enable GGML_HIP backend (requires ROCm toolchain).
- musa: Enable GGML_MUSA backend.
- sycl: Enable GGML_SYCL backend (requires SYCL toolchain).
- webgpu: Enable GGML_WEBGPU backend (requires WebGPU support in ggml).
§Examples
- CPU only (default): `cargo build`
- Metal on macOS: `cargo build --features metal`
- CUDA on Linux: `cargo build --features cuda`
- Vulkan: `cargo build --features vulkan`
- OpenCL: `cargo build --features opencl`
Note: Enabling a backend requires the corresponding SDK/toolchain to be installed and discoverable by CMake.
Structs§
- _IO_FILE
- _IO_codecvt
- _IO_marker
- _IO_wide_data
- ggml_backend
- ggml_backend_buffer
- ggml_backend_buffer_type
- ggml_backend_dev_caps
- ggml_backend_dev_props
- ggml_backend_device
- ggml_backend_event
- ggml_backend_feature
- ggml_backend_graph_copy
- ggml_backend_reg
- ggml_backend_sched
- ggml_bf16_t
- ggml_cgraph
- ggml_context
- ggml_cplan
- ggml_gallocr
- ggml_init_params
- ggml_object
- ggml_opt_context
- ggml_opt_dataset
- ggml_opt_optimizer_params
- ggml_opt_optimizer_params__bindgen_ty_1
- ggml_opt_optimizer_params__bindgen_ty_2
- ggml_opt_params
- ggml_opt_result
- ggml_tallocr
- ggml_tensor
- ggml_threadpool
- ggml_threadpool_params
- ggml_type_traits
- ggml_type_traits_cpu
- gguf_context
- gguf_init_params
Enums§
- ggml_backend_buffer_usage
- ggml_backend_dev_type
- ggml_ftype
- ggml_glu_op
- ggml_log_level
- ggml_numa_strategy
- ggml_object_type
- ggml_op
- ggml_op_pool
- ggml_opt_build_type
- ggml_opt_loss_type
- ggml_opt_optimizer_type
- ggml_prec
- ggml_scale_flag
- ggml_scale_mode
- ggml_sched_priority
- ggml_sort_order
- ggml_status
- ggml_tensor_flag
- ggml_type
- ggml_unary_op
- gguf_type
Constants§
- GGML_CANN_MAX_DEVICES
- GGML_COMMIT: ggml submodule commit (short hash).
- GGML_COMMIT_TIME: ggml submodule commit time (ISO 8601 or fallback).
- GGML_CUBLAS_NAME
- GGML_CUDA_MAX_DEVICES
- GGML_CUDA_NAME
- GGML_DEFAULT_GRAPH_SIZE
- GGML_DEFAULT_N_THREADS
- GGML_EXIT_ABORTED
- GGML_EXIT_SUCCESS
- GGML_FILE_MAGIC
- GGML_FILE_VERSION
- GGML_KQ_MASK_PAD
- GGML_MAX_DIMS
- GGML_MAX_NAME
- GGML_MAX_N_THREADS
- GGML_MAX_OP_PARAMS
- GGML_MAX_PARAMS
- GGML_MAX_SRC
- GGML_MEM_ALIGN
- GGML_MROPE_SECTIONS
- GGML_N_TASKS_MAX
- GGML_QNT_VERSION
- GGML_QNT_VERSION_FACTOR
- GGML_ROPE_TYPE_MROPE
- GGML_ROPE_TYPE_NEOX
- GGML_ROPE_TYPE_VISION
- GGML_RPC_MAX_SERVERS
- GGML_SYCL_MAX_DEVICES
- GGML_SYCL_NAME
- GGML_TENSOR_SIZE
- GGML_VK_MAX_DEVICES
- GGML_VK_NAME
- GGML_WEBGPU_NAME
- GGUF_DEFAULT_ALIGNMENT
- GGUF_KEY_GENERAL_ALIGNMENT
- GGUF_MAGIC
- GGUF_VERSION
Functions§
- ggml_
abort ⚠ - ggml_
abs ⚠ - ggml_
abs_ ⚠inplace - ggml_
acc ⚠ - ggml_
acc_ ⚠inplace - ggml_
add ⚠ - ggml_
add1 ⚠ - ggml_
add1_ ⚠inplace - ggml_
add_ ⚠cast - ggml_
add_ ⚠id - ggml_
add_ ⚠inplace - ggml_
add_ ⚠rel_ pos - ggml_
add_ ⚠rel_ pos_ inplace - ggml_
arange ⚠ - ggml_
are_ ⚠same_ shape - ggml_
are_ ⚠same_ stride - ggml_
argmax ⚠ - ggml_
argsort ⚠ - ggml_
backend_ ⚠alloc_ buffer - ggml_
backend_ ⚠alloc_ ctx_ tensors - ggml_
backend_ ⚠alloc_ ctx_ tensors_ from_ buft - ggml_
backend_ ⚠blas_ init - ggml_
backend_ ⚠blas_ reg - ggml_
backend_ ⚠blas_ set_ n_ threads - ggml_
backend_ ⚠buffer_ clear - ggml_
backend_ ⚠buffer_ free - ggml_
backend_ ⚠buffer_ get_ alignment - ggml_
backend_ ⚠buffer_ get_ alloc_ size - ggml_
backend_ ⚠buffer_ get_ base - ggml_
backend_ ⚠buffer_ get_ max_ size - ggml_
backend_ ⚠buffer_ get_ size - ggml_
backend_ ⚠buffer_ get_ type - ggml_
backend_ ⚠buffer_ get_ usage - ggml_
backend_ ⚠buffer_ init_ tensor - ggml_
backend_ ⚠buffer_ is_ host - ggml_
backend_ ⚠buffer_ name - ggml_
backend_ ⚠buffer_ reset - ggml_
backend_ ⚠buffer_ set_ usage - ggml_
backend_ ⚠buft_ alloc_ buffer - ggml_
backend_ ⚠buft_ get_ alignment - ggml_
backend_ ⚠buft_ get_ alloc_ size - ggml_
backend_ ⚠buft_ get_ device - ggml_
backend_ ⚠buft_ get_ max_ size - ggml_
backend_ ⚠buft_ is_ host - ggml_
backend_ ⚠buft_ name - ggml_
backend_ ⚠cann_ buffer_ type - Retrieves the CANN buffer type for a specified device.
- ggml_
backend_ ⚠cann_ get_ device_ count - Retrieves the number of CANN devices available.
- ggml_
backend_ ⚠cann_ get_ device_ description - Retrieves the description of a specific CANN device.
- ggml_
backend_ ⚠cann_ get_ device_ memory - Retrieves the memory information of a specific CANN device.
- ggml_
backend_ ⚠cann_ host_ buffer_ type - Pinned host buffer for use with the CPU backend for faster copies between CPU and NPU.
- ggml_
backend_ ⚠cann_ init - Initializes the CANN backend for a specified device.
- ggml_
backend_ ⚠cann_ reg - ggml_
backend_ ⚠compare_ graph_ backend - ggml_
backend_ ⚠cpu_ buffer_ from_ ptr - ggml_
backend_ ⚠cpu_ buffer_ type - ggml_
backend_ ⚠cpu_ init - ggml_
backend_ ⚠cpu_ reg - ggml_
backend_ ⚠cpu_ set_ abort_ callback - ggml_
backend_ ⚠cpu_ set_ n_ threads - ggml_
backend_ ⚠cpu_ set_ threadpool - ggml_
backend_ ⚠cuda_ buffer_ type - ggml_
backend_ ⚠cuda_ get_ device_ count - ggml_
backend_ ⚠cuda_ get_ device_ description - ggml_
backend_ ⚠cuda_ get_ device_ memory - ggml_
backend_ ⚠cuda_ host_ buffer_ type - ggml_
backend_ ⚠cuda_ init - ggml_
backend_ ⚠cuda_ reg - ggml_
backend_ ⚠cuda_ register_ host_ buffer - ggml_
backend_ ⚠cuda_ split_ buffer_ type - ggml_
backend_ ⚠cuda_ unregister_ host_ buffer - ggml_
backend_ ⚠dev_ backend_ reg - ggml_
backend_ ⚠dev_ buffer_ from_ host_ ptr - ggml_
backend_ ⚠dev_ buffer_ type - ggml_
backend_ ⚠dev_ by_ name - ggml_
backend_ ⚠dev_ by_ type - ggml_
backend_ ⚠dev_ count - ggml_
backend_ ⚠dev_ description - ggml_
backend_ ⚠dev_ get - ggml_
backend_ ⚠dev_ get_ props - ggml_
backend_ ⚠dev_ host_ buffer_ type - ggml_
backend_ ⚠dev_ init - ggml_
backend_ ⚠dev_ memory - ggml_
backend_ ⚠dev_ name - ggml_
backend_ ⚠dev_ offload_ op - ggml_
backend_ ⚠dev_ supports_ buft - ggml_
backend_ ⚠dev_ supports_ op - ggml_
backend_ ⚠dev_ type - ggml_
backend_ ⚠device_ register - ggml_
backend_ ⚠event_ free - ggml_
backend_ ⚠event_ new - ggml_
backend_ ⚠event_ record - ggml_
backend_ ⚠event_ synchronize - ggml_
backend_ ⚠event_ wait - ggml_
backend_ ⚠free - ggml_
backend_ ⚠get_ alignment - ggml_
backend_ ⚠get_ default_ buffer_ type - ggml_
backend_ ⚠get_ device - ggml_
backend_ ⚠get_ max_ size - ggml_
backend_ ⚠graph_ compute - ggml_
backend_ ⚠graph_ compute_ async - ggml_
backend_ ⚠graph_ copy - ggml_
backend_ ⚠graph_ copy_ free - ggml_
backend_ ⚠graph_ plan_ compute - ggml_
backend_ ⚠graph_ plan_ create - ggml_
backend_ ⚠graph_ plan_ free - ggml_
backend_ ⚠guid - ggml_
backend_ ⚠init_ best - ggml_
backend_ ⚠init_ by_ name - ggml_
backend_ ⚠init_ by_ type - ggml_
backend_ ⚠is_ blas - ggml_
backend_ ⚠is_ cann - Checks if a given backend is a CANN backend.
- ggml_
backend_ ⚠is_ cpu - ggml_
backend_ ⚠is_ cuda - ggml_
backend_ ⚠is_ metal - ggml_
backend_ ⚠is_ opencl - ggml_
backend_ ⚠is_ rpc - ggml_
backend_ ⚠is_ sycl - ggml_
backend_ ⚠is_ vk - ggml_
backend_ ⚠load - ggml_
backend_ ⚠load_ all - ggml_
backend_ ⚠load_ all_ from_ path - ggml_
backend_ ⚠metal_ buffer_ from_ ptr - ggml_
backend_ ⚠metal_ buffer_ type - ggml_
backend_ ⚠metal_ capture_ next_ compute - ggml_
backend_ ⚠metal_ init - ggml_
backend_ ⚠metal_ reg - ggml_
backend_ ⚠metal_ set_ abort_ callback - ggml_
backend_ ⚠metal_ supports_ family - ggml_
backend_ ⚠name - ggml_
backend_ ⚠offload_ op - ggml_
backend_ ⚠opencl_ buffer_ type - ggml_
backend_ ⚠opencl_ host_ buffer_ type - ggml_
backend_ ⚠opencl_ init - ggml_
backend_ ⚠opencl_ reg - ggml_
backend_ ⚠reg_ by_ name - ggml_
backend_ ⚠reg_ count - ggml_
backend_ ⚠reg_ dev_ count - ggml_
backend_ ⚠reg_ dev_ get - ggml_
backend_ ⚠reg_ get - ggml_
backend_ ⚠reg_ get_ proc_ address - ggml_
backend_ ⚠reg_ name - ggml_
backend_ ⚠rpc_ add_ device - ggml_
backend_ ⚠rpc_ buffer_ type - ggml_
backend_ ⚠rpc_ get_ device_ memory - ggml_
backend_ ⚠rpc_ init - ggml_
backend_ ⚠rpc_ reg - ggml_
backend_ ⚠rpc_ start_ server - ggml_
backend_ ⚠sched_ alloc_ graph - ggml_
backend_ ⚠sched_ free - ggml_
backend_ ⚠sched_ get_ backend - ggml_
backend_ ⚠sched_ get_ buffer_ size - ggml_
backend_ ⚠sched_ get_ n_ backends - ggml_
backend_ ⚠sched_ get_ n_ copies - ggml_
backend_ ⚠sched_ get_ n_ splits - ggml_
backend_ ⚠sched_ get_ tensor_ backend - ggml_
backend_ ⚠sched_ graph_ compute - ggml_
backend_ ⚠sched_ graph_ compute_ async - ggml_
backend_ ⚠sched_ new - ggml_
backend_ ⚠sched_ reserve - ggml_
backend_ ⚠sched_ reset - ggml_
backend_ ⚠sched_ set_ eval_ callback - ggml_
backend_ ⚠sched_ set_ tensor_ backend - ggml_
backend_ ⚠sched_ synchronize - ggml_
backend_ ⚠supports_ buft - ggml_
backend_ ⚠supports_ op - ggml_
backend_ ⚠sycl_ buffer_ type - ggml_
backend_ ⚠sycl_ get_ device_ count - ggml_
backend_ ⚠sycl_ get_ device_ description - ggml_
backend_ ⚠sycl_ get_ device_ memory - ggml_
backend_ ⚠sycl_ get_ gpu_ list - ggml_
backend_ ⚠sycl_ host_ buffer_ type - ggml_
backend_ ⚠sycl_ init - ggml_
backend_ ⚠sycl_ print_ sycl_ devices - ggml_
backend_ ⚠sycl_ reg - ggml_
backend_ ⚠sycl_ split_ buffer_ type - ggml_
backend_ ⚠synchronize - ggml_
backend_ ⚠tensor_ alloc - ggml_
backend_ ⚠tensor_ copy - ggml_
backend_ ⚠tensor_ copy_ async - ggml_
backend_ ⚠tensor_ get - ggml_
backend_ ⚠tensor_ get_ async - ggml_
backend_ ⚠tensor_ memset - ggml_
backend_ ⚠tensor_ set - ggml_
backend_ ⚠tensor_ set_ async - ggml_
backend_ ⚠unload - ggml_
backend_ ⚠view_ init - ggml_
backend_ ⚠vk_ buffer_ type - ggml_
backend_ ⚠vk_ get_ device_ count - ggml_
backend_ ⚠vk_ get_ device_ description - ggml_
backend_ ⚠vk_ get_ device_ memory - ggml_
backend_ ⚠vk_ host_ buffer_ type - ggml_
backend_ ⚠vk_ init - ggml_
backend_ ⚠vk_ reg - ggml_
backend_ ⚠webgpu_ init - ggml_
backend_ ⚠webgpu_ reg - ggml_
bf16_ ⚠to_ fp32 - ggml_
bf16_ ⚠to_ fp32_ row - ggml_
blck_ ⚠size - ggml_
build_ ⚠backward_ expand - ggml_
build_ ⚠forward_ expand - ggml_
can_ ⚠repeat - ggml_
cast ⚠ - ggml_
clamp ⚠ - ggml_
commit ⚠ - ggml_
concat ⚠ - ggml_
cont ⚠ - ggml_
cont_ ⚠1d - ggml_
cont_ ⚠2d - ggml_
cont_ ⚠3d - ggml_
cont_ ⚠4d - ggml_
conv_ ⚠1d - ggml_
conv_ ⚠1d_ dw - ggml_
conv_ ⚠1d_ dw_ ph - ggml_
conv_ ⚠1d_ ph - ggml_
conv_ ⚠2d - ggml_
conv_ ⚠2d_ direct - ggml_
conv_ ⚠2d_ dw - ggml_
conv_ ⚠2d_ dw_ direct - ggml_
conv_ ⚠2d_ s1_ ph - ggml_
conv_ ⚠2d_ sk_ p0 - ggml_
conv_ ⚠transpose_ 1d - ggml_
conv_ ⚠transpose_ 2d_ p0 - ggml_
cos ⚠ - ggml_
cos_ ⚠inplace - ggml_
count_ ⚠equal - ggml_
cpu_ ⚠bf16_ to_ fp32 - ggml_
cpu_ ⚠fp16_ to_ fp32 - ggml_
cpu_ ⚠fp32_ to_ bf16 - ggml_
cpu_ ⚠fp32_ to_ fp16 - ggml_
cpu_ ⚠fp32_ to_ fp32 - ggml_
cpu_ ⚠get_ sve_ cnt - ggml_
cpu_ ⚠has_ amx_ int8 - ggml_
cpu_ ⚠has_ arm_ fma - ggml_
cpu_ ⚠has_ avx - ggml_
cpu_ ⚠has_ avx2 - ggml_
cpu_ ⚠has_ avx512 - ggml_
cpu_ ⚠has_ avx512_ bf16 - ggml_
cpu_ ⚠has_ avx512_ vbmi - ggml_
cpu_ ⚠has_ avx512_ vnni - ggml_
cpu_ ⚠has_ avx_ vnni - ggml_
cpu_ ⚠has_ bmi2 - ggml_
cpu_ ⚠has_ dotprod - ggml_
cpu_ ⚠has_ f16c - ggml_
cpu_ ⚠has_ fma - ggml_
cpu_ ⚠has_ fp16_ va - ggml_
cpu_ ⚠has_ llamafile - ggml_
cpu_ ⚠has_ matmul_ int8 - ggml_
cpu_ ⚠has_ neon - ggml_
cpu_ ⚠has_ nnpa - ggml_
cpu_ ⚠has_ riscv_ v - ggml_
cpu_ ⚠has_ sme - ggml_
cpu_ ⚠has_ sse3 - ggml_
cpu_ ⚠has_ ssse3 - ggml_
cpu_ ⚠has_ sve - ggml_
cpu_ ⚠has_ vsx - ggml_
cpu_ ⚠has_ vxe - ggml_
cpu_ ⚠has_ wasm_ simd - ggml_
cpu_ ⚠init - ggml_
cpy ⚠ - ggml_
cross_ ⚠entropy_ loss - ggml_
cross_ ⚠entropy_ loss_ back - ggml_
custom_ ⚠4d - ggml_
custom_ ⚠inplace - ggml_
cycles ⚠ - ggml_
cycles_ ⚠per_ ms - ggml_
diag ⚠ - ggml_
diag_ ⚠mask_ inf - ggml_
diag_ ⚠mask_ inf_ inplace - ggml_
diag_ ⚠mask_ zero - ggml_
diag_ ⚠mask_ zero_ inplace - ggml_
div ⚠ - ggml_
div_ ⚠inplace - ggml_
dup ⚠ - ggml_
dup_ ⚠inplace - ggml_
dup_ ⚠tensor - ggml_
element_ ⚠size - ggml_
elu ⚠ - ggml_
elu_ ⚠inplace - ggml_
exp ⚠ - ggml_
exp_ ⚠inplace - ggml_
flash_ ⚠attn_ back - ggml_
flash_ ⚠attn_ ext - ggml_
flash_ ⚠attn_ ext_ add_ sinks - ggml_
flash_ ⚠attn_ ext_ get_ prec - ggml_
flash_ ⚠attn_ ext_ set_ prec - ggml_
fopen ⚠ - ggml_
format_ ⚠name - ggml_
fp16_ ⚠to_ fp32 - ggml_
fp16_ ⚠to_ fp32_ row - ggml_
fp32_ ⚠to_ bf16 - ggml_
fp32_ ⚠to_ bf16_ row - ggml_
fp32_ ⚠to_ bf16_ row_ ref - ggml_
fp32_ ⚠to_ fp16 - ggml_
fp32_ ⚠to_ fp16_ row - ggml_
free ⚠ - ggml_
ftype_ ⚠to_ ggml_ type - ggml_
gallocr_ ⚠alloc_ graph - ggml_
gallocr_ ⚠free - ggml_
gallocr_ ⚠get_ buffer_ size - ggml_
gallocr_ ⚠new - ggml_
gallocr_ ⚠new_ n - ggml_
gallocr_ ⚠reserve - ggml_
gallocr_ ⚠reserve_ n - ggml_
gated_ ⚠linear_ attn - ggml_
geglu ⚠ - ggml_
geglu_ ⚠erf - ggml_
geglu_ ⚠erf_ split - ggml_
geglu_ ⚠erf_ swapped - ggml_
geglu_ ⚠quick - ggml_
geglu_ ⚠quick_ split - ggml_
geglu_ ⚠quick_ swapped - ggml_
geglu_ ⚠split - ggml_
geglu_ ⚠swapped - ggml_
gelu ⚠ - ggml_
gelu_ ⚠erf - ggml_
gelu_ ⚠erf_ inplace - ggml_
gelu_ ⚠inplace - ggml_
gelu_ ⚠quick - ggml_
gelu_ ⚠quick_ inplace - ggml_
get_ ⚠data - ggml_
get_ ⚠data_ f32 - ggml_
get_ ⚠f32_ 1d - ggml_
get_ ⚠f32_ nd - ggml_
get_ ⚠first_ tensor - ggml_
get_ ⚠glu_ op - ggml_
get_ ⚠i32_ 1d - ggml_
get_ ⚠i32_ nd - ggml_
get_ ⚠max_ tensor_ size - ggml_
get_ ⚠mem_ buffer - ggml_
get_ ⚠mem_ size - ggml_
get_ ⚠name - ggml_
get_ ⚠next_ tensor - ggml_
get_ ⚠no_ alloc - ggml_
get_ ⚠rel_ pos - ggml_
get_ ⚠rows - ggml_
get_ ⚠rows_ back - ggml_
get_ ⚠tensor - ggml_
get_ ⚠type_ traits - ggml_
get_ ⚠type_ traits_ cpu - ggml_
get_ ⚠unary_ op - ggml_
glu ⚠ - ggml_
glu_ ⚠op_ name - ggml_
glu_ ⚠split - ggml_
graph_ ⚠add_ node - ggml_
graph_ ⚠clear - ggml_
graph_ ⚠compute - ggml_
graph_ ⚠compute_ with_ ctx - ggml_
graph_ ⚠cpy - ggml_
graph_ ⚠dump_ dot - ggml_
graph_ ⚠dup - ggml_
graph_ ⚠get_ grad - ggml_
graph_ ⚠get_ grad_ acc - ggml_
graph_ ⚠get_ tensor - ggml_
graph_ ⚠n_ nodes - ggml_
graph_ ⚠node - ggml_
graph_ ⚠nodes - ggml_
graph_ ⚠overhead - ggml_
graph_ ⚠overhead_ custom - ggml_
graph_ ⚠plan - ggml_
graph_ ⚠print - ggml_
graph_ ⚠reset - ggml_
graph_ ⚠size - ggml_
group_ ⚠norm - ggml_
group_ ⚠norm_ inplace - ggml_
guid_ ⚠matches - ggml_
hardsigmoid ⚠ - ggml_
hardswish ⚠ - ggml_
im2col ⚠ - ggml_
im2col_ ⚠back - ggml_
init ⚠ - ggml_
interpolate ⚠ - ggml_
is_ ⚠3d - ggml_
is_ ⚠contiguous - ggml_
is_ ⚠contiguous_ 0 - ggml_
is_ ⚠contiguous_ 1 - ggml_
is_ ⚠contiguous_ 2 - ggml_
is_ ⚠contiguous_ channels - ggml_
is_ ⚠contiguous_ rows - ggml_
is_ ⚠contiguously_ allocated - ggml_
is_ ⚠empty - ggml_
is_ ⚠matrix - ggml_
is_ ⚠numa - ggml_
is_ ⚠permuted - ggml_
is_ ⚠quantized - ggml_
is_ ⚠scalar - ggml_
is_ ⚠transposed - ggml_
is_ ⚠vector - ggml_
l2_ ⚠norm - ggml_
l2_ ⚠norm_ inplace - ggml_
leaky_ ⚠relu - ggml_
log ⚠ - ggml_
log_ ⚠inplace - ggml_
log_ ⚠set - ggml_
map_ ⚠custom1 - ggml_
map_ ⚠custom2 - ggml_
map_ ⚠custom3 - ggml_
map_ ⚠custom1_ inplace - ggml_
map_ ⚠custom2_ inplace - ggml_
map_ ⚠custom3_ inplace - ggml_
mean ⚠ - ggml_
mul ⚠ - ggml_
mul_ ⚠inplace - ggml_
mul_ ⚠mat - ggml_
mul_ ⚠mat_ id - ggml_
mul_ ⚠mat_ set_ prec - ggml_
n_ ⚠dims - ggml_
nbytes ⚠ - ggml_
nbytes_ ⚠pad - ggml_
neg ⚠ - ggml_
neg_ ⚠inplace - ggml_
nelements ⚠ - ggml_
new_ ⚠buffer - ggml_
new_ ⚠f32 - ggml_
new_ ⚠graph - ggml_
new_ ⚠graph_ custom - ggml_
new_ ⚠i32 - ggml_
new_ ⚠tensor - ggml_
new_ ⚠tensor_ 1d - ggml_
new_ ⚠tensor_ 2d - ggml_
new_ ⚠tensor_ 3d - ggml_
new_ ⚠tensor_ 4d - ggml_
norm ⚠ - ggml_
norm_ ⚠inplace - ggml_
nrows ⚠ - ggml_
numa_ ⚠init - ggml_
op_ ⚠desc - ggml_
op_ ⚠name - ggml_
op_ ⚠symbol - ggml_
opt_ ⚠alloc - ggml_
opt_ ⚠context_ optimizer_ type - ggml_
opt_ ⚠dataset_ data - ggml_
opt_ ⚠dataset_ free - ggml_
opt_ ⚠dataset_ get_ batch - ggml_
opt_ ⚠dataset_ get_ batch_ host - ggml_
opt_ ⚠dataset_ init - ggml_
opt_ ⚠dataset_ labels - ggml_
opt_ ⚠dataset_ ndata - ggml_
opt_ ⚠dataset_ shuffle - ggml_
opt_ ⚠default_ params - ggml_
opt_ ⚠epoch - ggml_
opt_ ⚠epoch_ callback_ progress_ bar - ggml_
opt_ ⚠eval - ggml_
opt_ ⚠fit - ggml_
opt_ ⚠free - ggml_
opt_ ⚠get_ constant_ optimizer_ params - ggml_
opt_ ⚠get_ default_ optimizer_ params - ggml_
opt_ ⚠grad_ acc - ggml_
opt_ ⚠init - ggml_
opt_ ⚠inputs - ggml_
opt_ ⚠labels - ggml_
opt_ ⚠loss - ggml_
opt_ ⚠ncorrect - ggml_
opt_ ⚠optimizer_ name - ggml_
opt_ ⚠outputs - ggml_
opt_ ⚠pred - ggml_
opt_ ⚠prepare_ alloc - ggml_
opt_ ⚠reset - ggml_
opt_ ⚠result_ accuracy - ggml_
opt_ ⚠result_ free - ggml_
opt_ ⚠result_ init - ggml_
opt_ ⚠result_ loss - ggml_
opt_ ⚠result_ ndata - ggml_
opt_ ⚠result_ pred - ggml_
opt_ ⚠result_ reset - ggml_
opt_ ⚠static_ graphs - ggml_
opt_ ⚠step_ adamw - ggml_
opt_ ⚠step_ sgd - ggml_
out_ ⚠prod - ggml_
pad ⚠ - ggml_
pad_ ⚠reflect_ 1d - ggml_
permute ⚠ - ggml_
pool_ ⚠1d - ggml_
pool_ ⚠2d - ggml_
pool_ ⚠2d_ back - ggml_
print_ ⚠object - ggml_
print_ ⚠objects - ggml_
quantize_ ⚠chunk - ggml_
quantize_ ⚠free - ggml_
quantize_ ⚠init - ggml_
quantize_ ⚠requires_ imatrix - ggml_
reglu ⚠ - ggml_
reglu_ ⚠split - ggml_
reglu_ ⚠swapped - ggml_
relu ⚠ - ggml_
relu_ ⚠inplace - ggml_
repeat ⚠ - ggml_
repeat_ ⚠4d - ggml_
repeat_ ⚠back - ggml_
reset ⚠ - ggml_
reshape ⚠ - ggml_
reshape_ ⚠1d - ggml_
reshape_ ⚠2d - ggml_
reshape_ ⚠3d - ggml_
reshape_ ⚠4d - ggml_
rms_ ⚠norm - ggml_
rms_ ⚠norm_ back - ggml_
rms_ ⚠norm_ inplace - ggml_
roll ⚠ - ggml_
rope ⚠ - ggml_
rope_ ⚠custom - ggml_
rope_ ⚠custom_ inplace - ggml_
rope_ ⚠ext - ggml_
rope_ ⚠ext_ back - ggml_
rope_ ⚠ext_ inplace - ggml_
rope_ ⚠inplace - ggml_
rope_ ⚠multi - ggml_
rope_ ⚠multi_ back - ggml_
rope_ ⚠multi_ inplace - ggml_
rope_ ⚠yarn_ corr_ dims - ggml_
row_ ⚠size - ggml_
rwkv_ ⚠wkv6 - ggml_
rwkv_ ⚠wkv7 - ggml_
scale ⚠ - ggml_
scale_ ⚠bias - ggml_
scale_ ⚠bias_ inplace - ggml_
scale_ ⚠inplace - ggml_
set ⚠ - ggml_
set_ ⚠1d - ggml_
set_ ⚠1d_ inplace - ggml_
set_ ⚠2d - ggml_
set_ ⚠2d_ inplace - ggml_
set_ ⚠abort_ callback - ggml_
set_ ⚠f32 - ggml_
set_ ⚠f32_ 1d - ggml_
set_ ⚠f32_ nd - ggml_
set_ ⚠i32 - ggml_
set_ ⚠i32_ 1d - ggml_
set_ ⚠i32_ nd - ggml_
set_ ⚠inplace - ggml_
set_ ⚠input - ggml_
set_ ⚠loss - ggml_
set_ ⚠name - ggml_
set_ ⚠no_ alloc - ggml_
set_ ⚠output - ggml_
set_ ⚠param - ggml_
set_ ⚠rows - ggml_
set_ ⚠zero - ggml_
sgn ⚠ - ggml_
sgn_ ⚠inplace - ggml_
sigmoid ⚠ - ggml_
sigmoid_ ⚠inplace - ggml_
silu ⚠ - ggml_
silu_ ⚠back - ggml_
silu_ ⚠inplace - ggml_
sin ⚠ - ggml_
sin_ ⚠inplace - ggml_
soft_ ⚠max - ggml_
soft_ ⚠max_ add_ sinks - ggml_
soft_ ⚠max_ ext - ggml_
soft_ ⚠max_ ext_ back - ggml_
soft_ ⚠max_ ext_ back_ inplace - ggml_
soft_ ⚠max_ inplace - ggml_
sqr ⚠ - ggml_
sqr_ ⚠inplace - ggml_
sqrt ⚠ - ggml_
sqrt_ ⚠inplace - ggml_
ssm_ ⚠conv - ggml_
ssm_ ⚠scan - ggml_
status_ ⚠to_ string - ggml_
step ⚠ - ggml_
step_ ⚠inplace - ggml_
sub ⚠ - ggml_
sub_ ⚠inplace - ggml_
sum ⚠ - ggml_
sum_ ⚠rows - ggml_
swiglu ⚠ - ggml_
swiglu_ ⚠oai - ggml_
swiglu_ ⚠split - ggml_
swiglu_ ⚠swapped - ggml_
tallocr_ ⚠alloc - ggml_
tallocr_ ⚠new - ggml_
tanh ⚠ - ggml_
tanh_ ⚠inplace - ggml_
tensor_ ⚠overhead - ggml_
threadpool_ ⚠free - ggml_
threadpool_ ⚠get_ n_ threads - ggml_
threadpool_ ⚠new - ggml_
threadpool_ ⚠params_ default - ggml_
threadpool_ ⚠params_ init - ggml_
threadpool_ ⚠params_ match - ggml_
threadpool_ ⚠pause - ggml_
threadpool_ ⚠resume - ggml_
time_ ⚠init - ggml_
time_ ⚠ms - ggml_
time_ ⚠us - ggml_
timestep_ ⚠embedding - ggml_
top_ ⚠k - ggml_
transpose ⚠ - ggml_
type_ ⚠name - ggml_
type_ ⚠size - ggml_
type_ ⚠sizef - ggml_
unary ⚠ - ggml_
unary_ ⚠inplace - ggml_
unary_ ⚠op_ name - ggml_
unravel_ ⚠index - ggml_
upscale ⚠ - ggml_
upscale_ ⚠ext - ggml_
used_ ⚠mem - ggml_
validate_ ⚠row_ data - ggml_
version ⚠ - ggml_
view_ ⚠1d - ggml_
view_ ⚠2d - ggml_
view_ ⚠3d - ggml_
view_ ⚠4d - ggml_
view_ ⚠tensor - ggml_
win_ ⚠part - ggml_
win_ ⚠unpart - gguf_
add_ ⚠tensor - gguf_
find_ ⚠key - gguf_
find_ ⚠tensor - gguf_
free ⚠ - gguf_
get_ ⚠alignment - gguf_
get_ ⚠arr_ data - gguf_
get_ ⚠arr_ n - gguf_
get_ ⚠arr_ str - gguf_
get_ ⚠arr_ type - gguf_
get_ ⚠data_ offset - gguf_
get_ ⚠key - gguf_
get_ ⚠kv_ type - gguf_
get_ ⚠meta_ data - gguf_
get_ ⚠meta_ size - gguf_
get_ ⚠n_ kv - gguf_
get_ ⚠n_ tensors - gguf_
get_ ⚠tensor_ name - gguf_
get_ ⚠tensor_ offset - gguf_
get_ ⚠tensor_ size - gguf_
get_ ⚠tensor_ type - gguf_
get_ ⚠val_ bool - gguf_
get_ ⚠val_ data - gguf_
get_ ⚠val_ f32 - gguf_
get_ ⚠val_ f64 - gguf_
get_ ⚠val_ i8 - gguf_
get_ ⚠val_ i16 - gguf_
get_ ⚠val_ i32 - gguf_
get_ ⚠val_ i64 - gguf_
get_ ⚠val_ str - gguf_
get_ ⚠val_ u8 - gguf_
get_ ⚠val_ u16 - gguf_
get_ ⚠val_ u32 - gguf_
get_ ⚠val_ u64 - gguf_
get_ ⚠version - gguf_
init_ ⚠empty - gguf_
init_ ⚠from_ file - gguf_
remove_ ⚠key - gguf_
set_ ⚠arr_ data - gguf_
set_ ⚠arr_ str - gguf_
set_ ⚠kv - gguf_
set_ ⚠tensor_ data - gguf_
set_ ⚠tensor_ type - gguf_
set_ ⚠val_ bool - gguf_
set_ ⚠val_ f32 - gguf_
set_ ⚠val_ f64 - gguf_
set_ ⚠val_ i8 - gguf_
set_ ⚠val_ i16 - gguf_
set_ ⚠val_ i32 - gguf_
set_ ⚠val_ i64 - gguf_
set_ ⚠val_ str - gguf_
set_ ⚠val_ u8 - gguf_
set_ ⚠val_ u16 - gguf_
set_ ⚠val_ u32 - gguf_
set_ ⚠val_ u64 - gguf_
type_ ⚠name - gguf_
write_ ⚠to_ file
Type Aliases§
- FILE
- _IO_lock_t
- __off64_t
- __off_t
- ggml_abort_callback
- ggml_abort_callback_t
- ggml_backend_buffer_t
- ggml_backend_buffer_type_t
- ggml_backend_dev_get_extra_bufts_t
- ggml_backend_dev_t
- ggml_backend_eval_callback
- ggml_backend_event_t
- ggml_backend_get_features_t
- ggml_backend_graph_plan_t
- ggml_backend_reg_t
- ggml_backend_sched_eval_callback
- ggml_backend_sched_t
- ggml_backend_set_abort_callback_t
- ggml_backend_set_n_threads_t
- ggml_backend_split_buffer_type_t
- ggml_backend_t
- ggml_custom1_op_t
- ggml_custom2_op_t
- ggml_custom3_op_t
- ggml_custom_op_t
- ggml_fp16_t
- ggml_from_float_t
- ggml_gallocr_t
- ggml_guid
- ggml_guid_t
- ggml_log_callback
- ggml_opt_context_t
- ggml_opt_dataset_t
- ggml_opt_epoch_callback
- ggml_opt_get_optimizer_params
- ggml_opt_result_t
- ggml_threadpool_t
- ggml_to_float_t
- ggml_vec_dot_t