llama-cpp-bindings-sys 0.7.0

Low level bindings to llama.cpp
Documentation
1
2
3
4
5
6
7
8
#include "common.cuh"

// Fusion entry point. Caller supplies x/a/inv_b explicitly.
//
// This header only declares the function; its definition is not visible here,
// so the roles noted below are taken from the signature and should be
// confirmed against the implementation.
//
//   ctx   - CUDA backend context, taken by non-const reference.
//   x     - read-only tensor operand.
//           NOTE(review): presumably the input the op is applied to - confirm.
//   a     - read-only tensor operand.
//           NOTE(review): presumably the snake "alpha" parameter - confirm.
//   inv_b - read-only tensor operand.
//           NOTE(review): name suggests a precomputed reciprocal of "b" - confirm.
//   dst   - the only non-const tensor argument.
//           NOTE(review): presumably receives the result - confirm.
void ggml_cuda_op_snake_fused(ggml_backend_cuda_context & ctx,
                              const ggml_tensor * x,
                              const ggml_tensor * a,
                              const ggml_tensor * inv_b,
                              ggml_tensor *       dst);