cutile 0.0.0-alpha

/*
 * SPDX-FileCopyrightText: Copyright (c) 2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
 * SPDX-License-Identifier: Apache-2.0
 */
//! Pre-built optimized GPU kernels.
//!
//! This module provides a collection of commonly used GPU kernels that are optimized
//! and ready to use. These kernels cover essential operations like tensor creation,
//! type conversion, and linear algebra.
//!
//! ## Available Kernel Modules
//!
//! - [`linalg`] - Linear algebra operations (GEMM, matrix-vector multiplication)
//! - [`creation`] - Tensor creation and initialization (`full`, `arange`)
//! - [`conversion`] - Type conversion operations between tensor element types
//!
//! ## Usage
//!
//! All kernels follow the same usage pattern with `_apply` launcher functions:
//!
//! ```rust,ignore
//! use cutile::api;
//! use cutile::kernels::creation::full_apply;
//!
//! // Create a tensor filled with a value
//! let val = 42.0f32;
//! let tensor = api::zeros([1024]).partition([128]);
//! let result = value((val, tensor))
//!     .apply(full_apply)
//!     .unpartition()
//!     .await;
//! ```

// Private implementation modules. Each one defines an item with the same name minus
// the leading underscore; only those items are exposed, via the re-exports below.
mod _conversion;
mod _creation;
mod _linalg;

// Public surface of this module: the kernel items listed in the module docs above.
pub use _conversion::conversion;
pub use _creation::creation;
pub use _linalg::linalg;