/// Alignment boundary, in bytes, for tile payloads.
/// Set to 128 bytes for GPU memory coalescing.
pub const TILE_ALIGNMENT: usize = 128;