mod common;
mod highp;
mod lowp;
use crate::fine::common::gradient::linear::SimdLinearKind;
use crate::fine::common::gradient::radial::SimdRadialKind;
use crate::fine::common::gradient::sweep::SimdSweepKind;
use crate::fine::common::gradient::{GradientPainter, calculate_t_vals};
use crate::fine::common::image::{FilteredImagePainter, NNImagePainter, PlainNNImagePainter};
use crate::fine::common::rounded_blurred_rect::BlurredRoundedRectFiller;
use crate::layer_manager::LayerManager;
use crate::peniko::{BlendMode, ImageQuality};
use crate::region::Region;
use crate::util::EncodedImageExt;
use alloc::vec;
use alloc::vec::Vec;
use core::fmt::Debug;
use core::iter;
use vello_common::coarse::{Cmd, CommandAttrs, WideTile};
use vello_common::encode::{
EncodedBlurredRoundedRectangle, EncodedGradient, EncodedImage, EncodedKind, EncodedPaint,
};
use vello_common::fearless_simd::{
Bytes, Simd, SimdBase, SimdFloat, SimdInt, SimdInto, f32x4, f32x8, f32x16, u8x16, u8x32, u32x4,
u32x8,
};
use vello_common::filter_effects::Filter;
use vello_common::kurbo::Affine;
use vello_common::mask::Mask;
use vello_common::paint::{ImageResolver, ImageSource, Paint, PremulColor, Tint};
use vello_common::pixmap::Pixmap;
use vello_common::simd::Splat4thExt;
use vello_common::tile::Tile;
use vello_common::util::f32_to_u8;
pub use highp::F32Kernel;
pub use lowp::U8Kernel;
const PIXEL_CENTER_OFFSET: f64 = 0.5;
pub(crate) const COLOR_COMPONENTS: usize = 4;
pub(crate) const TILE_HEIGHT_COMPONENTS: usize = Tile::HEIGHT as usize * COLOR_COMPONENTS;
pub const SCRATCH_BUF_SIZE: usize =
WideTile::WIDTH as usize * Tile::HEIGHT as usize * COLOR_COMPONENTS;
pub type ScratchBuf<F> = [F; SCRATCH_BUF_SIZE];
pub trait Numeric: Copy + Default + Clone + Debug + PartialEq + Send + Sync + 'static {
const ZERO: Self;
const ONE: Self;
}
impl Numeric for f32 {
const ZERO: Self = 0.0;
const ONE: Self = 1.0;
}
impl Numeric for u8 {
const ZERO: Self = 0;
const ONE: Self = 255;
}
pub trait NumericVec<S: Simd>: Copy + Clone + Send + Sync {
fn from_f32(simd: S, val: f32x16<S>) -> Self;
fn from_u8(simd: S, val: u8x16<S>) -> Self;
}
impl<S: Simd> NumericVec<S> for f32x16<S> {
#[inline(always)]
fn from_f32(_: S, val: Self) -> Self {
val
}
#[inline(always)]
fn from_u8(simd: S, val: u8x16<S>) -> Self {
let converted = u8_to_f32(val);
converted * Self::splat(simd, 1.0 / 255.0)
}
}
impl<S: Simd> NumericVec<S> for u8x16<S> {
#[inline(always)]
fn from_f32(simd: S, val: f32x16<S>) -> Self {
let v1 = f32x16::splat(simd, 255.0);
let v2 = f32x16::splat(simd, 0.5);
let mulled = val.mul_add(v1, v2);
f32_to_u8(mulled)
}
#[inline(always)]
fn from_u8(_: S, val: Self) -> Self {
val
}
}
#[inline(always)]
pub(crate) fn u8_to_f32<S: Simd>(val: u8x16<S>) -> f32x16<S> {
let simd = val.simd;
let zeroes = u8x16::splat(simd, 0);
let zip1 = simd.zip_high_u8x16(val, zeroes);
let zip2 = simd.zip_low_u8x16(val, zeroes);
let p1 = simd
.zip_low_u8x16(zip2, zeroes)
.bitcast::<u32x4<S>>()
.to_float::<f32x4<S>>();
let p2 = simd
.zip_high_u8x16(zip2, zeroes)
.bitcast::<u32x4<S>>()
.to_float::<f32x4<S>>();
let p3 = simd
.zip_low_u8x16(zip1, zeroes)
.bitcast::<u32x4<S>>()
.to_float::<f32x4<S>>();
let p4 = simd
.zip_high_u8x16(zip1, zeroes)
.bitcast::<u32x4<S>>()
.to_float::<f32x4<S>>();
simd.combine_f32x8(simd.combine_f32x4(p1, p2), simd.combine_f32x4(p3, p4))
}
pub trait CompositeType<N: Numeric, S: Simd>: Copy + Clone + Send + Sync {
const LENGTH: usize;
fn from_slice(simd: S, slice: &[N]) -> Self;
fn from_color(simd: S, color: [N; 4]) -> Self;
}
impl<S: Simd> CompositeType<f32, S> for f32x16<S> {
const LENGTH: usize = 16;
#[inline(always)]
fn from_slice(simd: S, slice: &[f32]) -> Self {
<Self as SimdBase<_>>::from_slice(simd, slice)
}
#[inline(always)]
fn from_color(simd: S, color: [f32; 4]) -> Self {
Self::block_splat(f32x4::from_slice(simd, &color[..]))
}
}
impl<S: Simd> CompositeType<u8, S> for u8x32<S> {
const LENGTH: usize = 32;
#[inline(always)]
fn from_slice(simd: S, slice: &[u8]) -> Self {
<Self as SimdBase<_>>::from_slice(simd, slice)
}
#[inline(always)]
fn from_color(simd: S, color: [u8; 4]) -> Self {
u32x8::block_splat(u32x4::splat(simd, u32::from_ne_bytes(color))).to_bytes()
}
}
pub trait FineKernel<S: Simd>: Send + Sync + 'static {
type Numeric: Numeric;
type Composite: CompositeType<Self::Numeric, S>;
type NumericVec: NumericVec<S>;
fn extract_color(color: PremulColor) -> [Self::Numeric; 4];
fn pack(simd: S, region: &mut Region<'_>, blend_buf: &[Self::Numeric]);
fn unpack(simd: S, region: &mut Region<'_>, blend_buf: &mut [Self::Numeric]);
fn filter_layer(
pixmap: &mut Pixmap,
filter: &Filter,
layer_manager: &mut LayerManager,
transform: Affine,
);
fn copy_solid(simd: S, target: &mut [Self::Numeric], color: [Self::Numeric; 4]);
fn gradient_painter<'a>(
simd: S,
gradient: &'a EncodedGradient,
t_vals: &'a [f32],
) -> impl Painter + 'a {
simd.vectorize(
#[inline(always)]
|| GradientPainter::new(simd, gradient, t_vals),
)
}
fn gradient_painter_with_undefined<'a>(
simd: S,
gradient: &'a EncodedGradient,
t_vals: &'a [f32],
) -> impl Painter + 'a {
simd.vectorize(
#[inline(always)]
|| GradientPainter::new(simd, gradient, t_vals),
)
}
fn plain_nn_image_painter<'a>(
simd: S,
image: &'a EncodedImage,
pixmap: &'a Pixmap,
start_x: f64,
start_y: f64,
) -> impl Painter + 'a {
simd.vectorize(
#[inline(always)]
|| PlainNNImagePainter::new(simd, image, pixmap, start_x, start_y),
)
}
fn nn_image_painter<'a>(
simd: S,
image: &'a EncodedImage,
pixmap: &'a Pixmap,
start_x: f64,
start_y: f64,
) -> impl Painter + 'a {
simd.vectorize(
#[inline(always)]
|| NNImagePainter::new(simd, image, pixmap, start_x, start_y),
)
}
fn medium_quality_image_painter<'a>(
simd: S,
image: &'a EncodedImage,
pixmap: &'a Pixmap,
start_x: f64,
start_y: f64,
) -> impl Painter + 'a {
simd.vectorize(
#[inline(always)]
|| FilteredImagePainter::<S, 1>::new(simd, image, pixmap, start_x, start_y),
)
}
fn plain_medium_quality_image_painter<'a>(
simd: S,
image: &'a EncodedImage,
pixmap: &'a Pixmap,
start_x: f64,
start_y: f64,
) -> impl Painter + 'a {
simd.vectorize(
#[inline(always)]
|| FilteredImagePainter::<S, 1>::new(simd, image, pixmap, start_x, start_y),
)
}
fn high_quality_image_painter<'a>(
simd: S,
image: &'a EncodedImage,
pixmap: &'a Pixmap,
start_x: f64,
start_y: f64,
) -> impl Painter + 'a {
simd.vectorize(
#[inline(always)]
|| FilteredImagePainter::<S, 2>::new(simd, image, pixmap, start_x, start_y),
)
}
fn blurred_rounded_rectangle_painter(
simd: S,
rect: &EncodedBlurredRoundedRectangle,
start_x: f64,
start_y: f64,
) -> impl Painter {
simd.vectorize(
#[inline(always)]
|| BlurredRoundedRectFiller::new(simd, rect, start_x, start_y),
)
}
fn apply_mask(simd: S, dest: &mut [Self::Numeric], src: impl Iterator<Item = Self::NumericVec>);
fn apply_painter<'a>(simd: S, dest: &mut [Self::Numeric], painter: impl Painter + 'a);
fn apply_tint(simd: S, dest: &mut [Self::Numeric], tint: &Tint);
fn alpha_composite_solid(
simd: S,
target: &mut [Self::Numeric],
src: [Self::Numeric; 4],
alphas: Option<&[u8]>,
);
fn alpha_composite_buffer(
simd: S,
dest: &mut [Self::Numeric],
src: &[Self::Numeric],
alphas: Option<&[u8]>,
);
fn blend(
simd: S,
dest: &mut [Self::Numeric],
start_x: u16,
start_y: u16,
src: impl Iterator<Item = Self::Composite>,
blend_mode: BlendMode,
alphas: Option<&[u8]>,
mask: Option<&Mask>,
);
}
#[derive(Debug)]
pub struct Fine<S: Simd, T: FineKernel<S>> {
pub(crate) wide_coords: (u16, u16),
pub(crate) blend_buf: Vec<ScratchBuf<T::Numeric>>,
pub(crate) paint_buf: ScratchBuf<T::Numeric>,
pub(crate) f32_buf: Vec<f32>,
pub(crate) simd: S,
}
impl<S: Simd, T: FineKernel<S>> Fine<S, T> {
pub fn new(simd: S) -> Self {
Self {
simd,
wide_coords: (0, 0),
blend_buf: vec![[T::Numeric::ZERO; SCRATCH_BUF_SIZE]],
f32_buf: vec![0.0; SCRATCH_BUF_SIZE / 4],
paint_buf: [T::Numeric::ZERO; SCRATCH_BUF_SIZE],
}
}
pub fn set_coords(&mut self, x: u16, y: u16) {
self.wide_coords = (x, y);
}
pub fn clear(&mut self, premul_color: PremulColor) {
let converted_color = T::extract_color(premul_color);
let blend_buf = self.blend_buf.last_mut().unwrap();
T::copy_solid(self.simd, blend_buf, converted_color);
}
pub fn pack(&self, region: &mut Region<'_>) {
let blend_buf = self.blend_buf.last().unwrap();
T::pack(self.simd, region, blend_buf);
}
pub fn unpack(&mut self, region: &mut Region<'_>) {
let blend_buf = self.blend_buf.last_mut().unwrap();
T::unpack(self.simd, region, blend_buf);
}
pub fn filter_layer(
&self,
pixmap: &mut Pixmap,
filter: &Filter,
layer_manager: &mut LayerManager,
transform: Affine,
) {
T::filter_layer(pixmap, filter, layer_manager, transform);
}
pub(crate) fn run_cmd(
&mut self,
cmd: &Cmd,
alphas: &[u8],
paints: &[EncodedPaint],
image_resolver: &dyn ImageResolver,
attrs: &CommandAttrs,
) {
match cmd {
Cmd::Fill(f) => {
let fill_attrs = &attrs.fill[f.attrs_idx as usize];
self.fill(
usize::from(f.x),
usize::from(f.width),
&fill_attrs.paint,
fill_attrs.blend_mode,
paints,
image_resolver,
None,
fill_attrs.mask.as_ref(),
);
}
Cmd::AlphaFill(s) => {
let fill_attrs = &attrs.fill[s.attrs_idx as usize];
let alpha_idx = fill_attrs.alpha_idx(s.alpha_offset) as usize;
self.fill(
usize::from(s.x),
usize::from(s.width),
&fill_attrs.paint,
fill_attrs.blend_mode,
paints,
image_resolver,
Some(&alphas[alpha_idx..]),
fill_attrs.mask.as_ref(),
);
}
Cmd::Filter(_filter, _) => {
}
Cmd::PushBuf(_layer_kind, _) => {
self.blend_buf.push([T::Numeric::ZERO; SCRATCH_BUF_SIZE]);
}
Cmd::PopBuf => {
self.blend_buf.pop();
}
Cmd::ClipFill(cf) => {
self.clip(cf.x as usize, cf.width as usize, None);
}
Cmd::ClipStrip(cs) => {
let clip_attrs = &attrs.clip[cs.attrs_idx as usize];
let alpha_idx = clip_attrs.alpha_idx(cs.alpha_offset) as usize;
self.clip(cs.x as usize, cs.width as usize, Some(&alphas[alpha_idx..]));
}
Cmd::Blend(b) => self.blend(*b),
Cmd::Mask(m) => {
let start_x = self.wide_coords.0 * WideTile::WIDTH;
let start_y = self.wide_coords.1 * Tile::HEIGHT;
let blend_buf = self.blend_buf.last_mut().unwrap();
let width = (blend_buf.len() / (Tile::HEIGHT as usize * COLOR_COMPONENTS)) as u16;
let y = start_y as u32 + u32x4::from_slice(self.simd, &[0, 1, 2, 3]);
let iter = (start_x..(start_x + width)).map(|x| {
let x_in_range = x < m.width();
macro_rules! sample {
($idx:expr) => {
if x_in_range && (y[$idx] as u16) < m.height() {
m.sample(x, y[$idx] as u16)
} else {
0
}
};
}
let s1 = sample!(0);
let s2 = sample!(1);
let s3 = sample!(2);
let s4 = sample!(3);
let samples = u8x16::from_slice(
self.simd,
&[
s1, s1, s1, s1, s2, s2, s2, s2, s3, s3, s3, s3, s4, s4, s4, s4,
],
);
T::NumericVec::from_u8(self.simd, samples)
});
T::apply_mask(self.simd, blend_buf, iter);
}
Cmd::Opacity(o) => {
if *o != 1.0 {
let blend_buf = self.blend_buf.last_mut().unwrap();
T::apply_mask(
self.simd,
blend_buf,
iter::repeat(T::NumericVec::from_f32(
self.simd,
f32x16::splat(self.simd, *o),
)),
);
}
}
Cmd::PushZeroClip(_) | Cmd::PopZeroClip => {
unreachable!();
}
Cmd::BatchEnd => {}
}
}
pub fn fill(
&mut self,
x: usize,
width: usize,
fill: &Paint,
blend_mode: BlendMode,
encoded_paints: &[EncodedPaint],
image_resolver: &dyn ImageResolver,
alphas: Option<&[u8]>,
mask: Option<&Mask>,
) {
let blend_buf = &mut self.blend_buf.last_mut().unwrap()[x * TILE_HEIGHT_COMPONENTS..]
[..TILE_HEIGHT_COMPONENTS * width];
let default_blend = blend_mode == BlendMode::default();
match fill {
Paint::Solid(color) => {
let color = T::extract_color(*color);
if color[3] == T::Numeric::ONE
&& default_blend
&& alphas.is_none()
&& mask.is_none()
{
T::copy_solid(self.simd, blend_buf, color);
return;
}
if default_blend && mask.is_none() {
T::alpha_composite_solid(self.simd, blend_buf, color, alphas);
} else {
let start_x = self.wide_coords.0 * WideTile::WIDTH + x as u16;
let start_y = self.wide_coords.1 * Tile::HEIGHT;
T::blend(
self.simd,
blend_buf,
start_x,
start_y,
iter::repeat(T::Composite::from_color(self.simd, color)),
blend_mode,
alphas,
mask,
);
}
}
Paint::Indexed(paint) => {
let color_buf = &mut self.paint_buf[x * TILE_HEIGHT_COMPONENTS..]
[..TILE_HEIGHT_COMPONENTS * width];
let encoded_paint = &encoded_paints[paint.index()];
let start_x = self.wide_coords.0 * WideTile::WIDTH + x as u16;
let start_y = self.wide_coords.1 * Tile::HEIGHT;
let sampler_x = start_x as f64 + PIXEL_CENTER_OFFSET;
let sampler_y = start_y as f64 + PIXEL_CENTER_OFFSET;
macro_rules! fill_complex_paint {
($may_have_opacities:expr, $filler:expr) => {
fill_complex_paint!($may_have_opacities, $filler, None::<&Tint>)
};
($may_have_opacities:expr, $filler:expr, $tint:expr) => {
if $may_have_opacities || alphas.is_some() {
T::apply_painter(self.simd, color_buf, $filler);
if let Some(t) = $tint {
T::apply_tint(self.simd, color_buf, t);
}
if default_blend && mask.is_none() {
T::alpha_composite_buffer(self.simd, blend_buf, color_buf, alphas);
} else {
T::blend(
self.simd,
blend_buf,
start_x,
start_y,
color_buf
.chunks_exact(T::Composite::LENGTH)
.map(|s| T::Composite::from_slice(self.simd, s)),
blend_mode,
alphas,
mask,
);
}
} else {
T::apply_painter(self.simd, blend_buf, $filler);
if let Some(t) = $tint {
T::apply_tint(self.simd, blend_buf, t);
}
}
};
}
match encoded_paint {
EncodedPaint::BlurredRoundedRect(b) => {
fill_complex_paint!(
true,
T::blurred_rounded_rectangle_painter(
self.simd, b, sampler_x, sampler_y
)
);
}
EncodedPaint::Gradient(g) => {
let f32_buf = &mut self.f32_buf[..width * Tile::HEIGHT as usize];
match &g.kind {
EncodedKind::Linear(l) => {
calculate_t_vals(
self.simd,
SimdLinearKind::new(self.simd, *l),
f32_buf,
g,
sampler_x,
sampler_y,
);
fill_complex_paint!(
g.may_have_opacities,
T::gradient_painter(self.simd, g, f32_buf)
);
}
EncodedKind::Sweep(s) => {
calculate_t_vals(
self.simd,
SimdSweepKind::new(self.simd, s),
f32_buf,
g,
sampler_x,
sampler_y,
);
fill_complex_paint!(
g.may_have_opacities,
T::gradient_painter(self.simd, g, f32_buf)
);
}
EncodedKind::Radial(r) => {
calculate_t_vals(
self.simd,
SimdRadialKind::new(self.simd, r),
f32_buf,
g,
sampler_x,
sampler_y,
);
if r.has_undefined() {
fill_complex_paint!(
g.may_have_opacities,
T::gradient_painter_with_undefined(self.simd, g, f32_buf)
);
} else {
fill_complex_paint!(
g.may_have_opacities,
T::gradient_painter(self.simd, g, f32_buf)
);
}
}
}
}
EncodedPaint::Image(i) => {
let pixmap = match &i.source {
ImageSource::Pixmap(p) => p.clone(),
ImageSource::OpaqueId { id, .. } => image_resolver
.resolve(*id)
.unwrap_or_else(|| panic!("Image {:?} not found in registry", id)),
};
let tint = i.tint.as_ref();
match (i.has_skew(), i.nearest_neighbor()) {
(false, false) => {
if i.sampler.quality == ImageQuality::Medium {
fill_complex_paint!(
i.may_have_opacities,
T::plain_medium_quality_image_painter(
self.simd, i, &pixmap, sampler_x, sampler_y
),
tint
);
} else {
fill_complex_paint!(
i.may_have_opacities,
T::high_quality_image_painter(
self.simd, i, &pixmap, sampler_x, sampler_y
),
tint
);
}
}
(true, false) => {
if i.sampler.quality == ImageQuality::Medium {
fill_complex_paint!(
i.may_have_opacities,
T::medium_quality_image_painter(
self.simd, i, &pixmap, sampler_x, sampler_y
),
tint
);
} else {
fill_complex_paint!(
i.may_have_opacities,
T::high_quality_image_painter(
self.simd, i, &pixmap, sampler_x, sampler_y
),
tint
);
}
}
(false, true) => {
fill_complex_paint!(
i.may_have_opacities,
T::plain_nn_image_painter(
self.simd, i, &pixmap, sampler_x, sampler_y
),
tint
);
}
(true, true) => {
fill_complex_paint!(
i.may_have_opacities,
T::nn_image_painter(
self.simd, i, &pixmap, sampler_x, sampler_y
),
tint
);
}
}
}
}
}
}
}
pub(crate) fn blend(&mut self, blend_mode: BlendMode) {
let (source_buffer, rest) = self.blend_buf.split_last_mut().unwrap();
let target_buffer = rest.last_mut().unwrap();
if blend_mode == BlendMode::default() {
T::alpha_composite_buffer(self.simd, target_buffer, source_buffer, None);
} else {
T::blend(
self.simd,
target_buffer,
0,
0,
source_buffer
.chunks_exact(T::Composite::LENGTH)
.map(|s| T::Composite::from_slice(self.simd, s)),
blend_mode,
None,
None,
);
}
}
fn clip(&mut self, x: usize, width: usize, alphas: Option<&[u8]>) {
let (source_buffer, rest) = self.blend_buf.split_last_mut().unwrap();
let target_buffer = rest.last_mut().unwrap();
let source_buffer =
&mut source_buffer[x * TILE_HEIGHT_COMPONENTS..][..TILE_HEIGHT_COMPONENTS * width];
let target_buffer =
&mut target_buffer[x * TILE_HEIGHT_COMPONENTS..][..TILE_HEIGHT_COMPONENTS * width];
T::alpha_composite_buffer(self.simd, target_buffer, source_buffer, alphas);
}
}
pub trait Painter {
fn paint_u8(&mut self, buf: &mut [u8]);
fn paint_f32(&mut self, buf: &mut [f32]);
}
pub trait PosExt<S: Simd> {
fn splat_pos(simd: S, pos: f32, x_advance: f32, y_advance: f32) -> Self;
}
impl<S: Simd> PosExt<S> for f32x4<S> {
#[inline(always)]
fn splat_pos(simd: S, pos: f32, _: f32, y_advance: f32) -> Self {
let columns: [f32; Tile::HEIGHT as usize] = [0.0, 1.0, 2.0, 3.0];
let column_mask: Self = columns.simd_into(simd);
column_mask.mul_add(Self::splat(simd, y_advance), Self::splat(simd, pos))
}
}
impl<S: Simd> PosExt<S> for f32x8<S> {
#[inline(always)]
fn splat_pos(simd: S, pos: f32, x_advance: f32, y_advance: f32) -> Self {
simd.combine_f32x4(
f32x4::splat_pos(simd, pos, x_advance, y_advance),
f32x4::splat_pos(simd, pos + x_advance, x_advance, y_advance),
)
}
}
pub(crate) struct ShaderResultF32<S: Simd> {
pub(crate) r: f32x8<S>,
pub(crate) g: f32x8<S>,
pub(crate) b: f32x8<S>,
pub(crate) a: f32x8<S>,
}
impl<S: Simd> ShaderResultF32<S> {
#[inline(always)]
pub(crate) fn get(&self) -> (f32x16<S>, f32x16<S>) {
let (r_1, r_2) = self.r.simd.split_f32x8(self.r);
let (g_1, g_2) = self.g.simd.split_f32x8(self.g);
let (b_1, b_2) = self.b.simd.split_f32x8(self.b);
let (a_1, a_2) = self.a.simd.split_f32x8(self.a);
let first = self.r.simd.combine_f32x8(
self.r.simd.combine_f32x4(r_1, g_1),
self.r.simd.combine_f32x4(b_1, a_1),
);
let second = self.r.simd.combine_f32x8(
self.r.simd.combine_f32x4(r_2, g_2),
self.r.simd.combine_f32x4(b_2, a_2),
);
(first, second)
}
}
mod macros {
macro_rules! f32x16_painter {
($($type_path:tt)+) => {
impl<S: Simd> crate::fine::Painter for $($type_path)+ {
fn paint_u8(&mut self, buf: &mut [u8]) {
use vello_common::fearless_simd::*;
use crate::fine::NumericVec;
self.simd.vectorize(#[inline(always)] || {
for chunk in buf.chunks_exact_mut(16) {
let next = self.next().unwrap();
let converted = u8x16::<S>::from_f32(next.simd, next);
chunk.copy_from_slice(converted.as_slice());
}
})
}
fn paint_f32(&mut self, buf: &mut [f32]) {
self.simd.vectorize(#[inline(always)] || {
for chunk in buf.chunks_exact_mut(16) {
let next = self.next().unwrap();
chunk.copy_from_slice(next.as_slice());
}
})
}
}
};
}
macro_rules! u8x16_painter {
($($type_path:tt)+) => {
impl<S: Simd> crate::fine::Painter for $($type_path)+ {
fn paint_u8(&mut self, buf: &mut [u8]) {
self.simd.vectorize(#[inline(always)] || {
for chunk in buf.chunks_exact_mut(16) {
let next = self.next().unwrap();
chunk.copy_from_slice(next.as_slice());
}
})
}
fn paint_f32(&mut self, buf: &mut [f32]) {
use vello_common::fearless_simd::*;
use crate::fine::NumericVec;
self.simd.vectorize(#[inline(always)] || {
for chunk in buf.chunks_exact_mut(16) {
let next = self.next().unwrap();
let converted = f32x16::<S>::from_u8(next.simd, next);
chunk.copy_from_slice(converted.as_slice());
}
})
}
}
};
}
pub(crate) use f32x16_painter;
pub(crate) use u8x16_painter;
}