/// Minimum batch size below which GPU offload is not attempted.
///
/// Below this threshold the host↔device transfer overhead exceeds the
/// compute savings. Mirrors `tinyquant_gpu_wgpu::GPU_BATCH_THRESHOLD`.
pub const GPU_BATCH_THRESHOLD: usize = 512;