use core::borrow::Borrow;
use slop_air::{Air, BaseAir, PairBuilder};
use slop_algebra::{extension::BinomiallyExtendable, Field, PrimeField32};
use slop_matrix::Matrix;
use slop_maybe_rayon::prelude::{IndexedParallelIterator, ParallelIterator, ParallelSliceMut};
use sp1_derive::AlignedBorrow;
use sp1_hypercube::{
air::{ExtensionAirBuilder, MachineAir},
next_multiple_of_32,
};
use sp1_primitives::SP1Field;
use sp1_recursion_executor::{
Address, Block, ExecutionRecord, ExtAluInstr, ExtAluIo, ExtAluOpcode, Instruction,
RecursionProgram, D,
};
use std::{borrow::BorrowMut, iter::zip, mem::MaybeUninit};
use crate::builder::SP1RecursionAirBuilder;
pub const NUM_EXT_ALU_ENTRIES_PER_ROW: usize = 1;
#[derive(Default, Clone)]
pub struct ExtAluChip;
pub const NUM_EXT_ALU_COLS: usize = core::mem::size_of::<ExtAluCols<u8>>();
#[derive(AlignedBorrow, Debug, Clone, Copy)]
#[repr(C)]
pub struct ExtAluCols<F: Copy> {
pub values: [ExtAluValueCols<F>; NUM_EXT_ALU_ENTRIES_PER_ROW],
}
const NUM_EXT_ALU_VALUE_COLS: usize = core::mem::size_of::<ExtAluValueCols<u8>>();
#[derive(AlignedBorrow, Debug, Clone, Copy)]
#[repr(C)]
pub struct ExtAluValueCols<F: Copy> {
pub vals: ExtAluIo<Block<F>>,
}
pub const NUM_EXT_ALU_PREPROCESSED_COLS: usize = core::mem::size_of::<ExtAluPreprocessedCols<u8>>();
#[derive(AlignedBorrow, Debug, Clone, Copy)]
#[repr(C)]
pub struct ExtAluPreprocessedCols<F: Copy> {
pub accesses: [ExtAluAccessCols<F>; NUM_EXT_ALU_ENTRIES_PER_ROW],
}
pub const NUM_EXT_ALU_ACCESS_COLS: usize = core::mem::size_of::<ExtAluAccessCols<u8>>();
#[derive(AlignedBorrow, Debug, Clone, Copy)]
#[repr(C)]
pub struct ExtAluAccessCols<F: Copy> {
pub addrs: ExtAluIo<Address<F>>,
pub is_add: F,
pub is_sub: F,
pub is_mul: F,
pub is_div: F,
pub mult: F,
}
impl<F: Field> BaseAir<F> for ExtAluChip {
fn width(&self) -> usize {
NUM_EXT_ALU_COLS
}
}
impl<F: PrimeField32 + BinomiallyExtendable<D>> MachineAir<F> for ExtAluChip {
type Record = ExecutionRecord<F>;
type Program = RecursionProgram<F>;
fn name(&self) -> &'static str {
"ExtAlu"
}
fn preprocessed_width(&self) -> usize {
NUM_EXT_ALU_PREPROCESSED_COLS
}
fn preprocessed_num_rows(&self, program: &Self::Program) -> Option<usize> {
let instrs_len = program
.inner
.iter()
.filter_map(|instruction| match instruction.inner() {
Instruction::ExtAlu(x) => Some(x),
_ => None,
})
.count();
self.preprocessed_num_rows_with_instrs_len(program, instrs_len)
}
fn preprocessed_num_rows_with_instrs_len(
&self,
program: &Self::Program,
instrs_len: usize,
) -> Option<usize> {
let height = program.shape.as_ref().and_then(|shape| shape.height(self));
let nb_rows = instrs_len.div_ceil(NUM_EXT_ALU_ENTRIES_PER_ROW);
Some(next_multiple_of_32(nb_rows, height))
}
fn generate_preprocessed_trace_into(
&self,
program: &Self::Program,
buffer: &mut [MaybeUninit<F>],
) {
assert_eq!(
std::any::TypeId::of::<F>(),
std::any::TypeId::of::<SP1Field>(),
"generate_preprocessed_trace only supports SP1Field field"
);
let instrs = program
.inner
.iter()
.filter_map(|instruction| match instruction.inner() {
Instruction::ExtAlu(x) => Some(x),
_ => None,
})
.collect::<Vec<_>>();
let padded_nb_rows =
self.preprocessed_num_rows_with_instrs_len(program, instrs.len()).unwrap();
let buffer_ptr = buffer.as_mut_ptr() as *mut F;
let values = unsafe {
core::slice::from_raw_parts_mut(
buffer_ptr,
padded_nb_rows * NUM_EXT_ALU_PREPROCESSED_COLS,
)
};
unsafe {
let padding_start = instrs.len() * NUM_EXT_ALU_ACCESS_COLS;
let padding_size = padded_nb_rows * NUM_EXT_ALU_PREPROCESSED_COLS - padding_start;
if padding_size > 0 {
core::ptr::write_bytes(buffer[padding_start..].as_mut_ptr(), 0, padding_size);
}
}
let populate_len = instrs.len() * NUM_EXT_ALU_ACCESS_COLS;
values[..populate_len].par_chunks_mut(NUM_EXT_ALU_ACCESS_COLS).zip_eq(instrs).for_each(
|(row, instr)| {
let ExtAluInstr { opcode, mult, addrs } = instr;
let access: &mut ExtAluAccessCols<_> = row.borrow_mut();
*access = ExtAluAccessCols {
addrs: addrs.to_owned(),
is_add: F::from_bool(false),
is_sub: F::from_bool(false),
is_mul: F::from_bool(false),
is_div: F::from_bool(false),
mult: mult.to_owned(),
};
let target_flag = match opcode {
ExtAluOpcode::AddE => &mut access.is_add,
ExtAluOpcode::SubE => &mut access.is_sub,
ExtAluOpcode::MulE => &mut access.is_mul,
ExtAluOpcode::DivE => &mut access.is_div,
};
*target_flag = F::from_bool(true);
},
);
}
fn generate_dependencies(&self, _: &Self::Record, _: &mut Self::Record) {
}
fn num_rows(&self, input: &Self::Record) -> Option<usize> {
let height = input.program.shape.as_ref().and_then(|shape| shape.height(self));
let events = &input.ext_alu_events;
let nb_rows = events.len().div_ceil(NUM_EXT_ALU_ENTRIES_PER_ROW);
Some(next_multiple_of_32(nb_rows, height))
}
fn generate_trace_into(
&self,
input: &ExecutionRecord<F>,
_: &mut ExecutionRecord<F>,
buffer: &mut [MaybeUninit<F>],
) {
assert_eq!(
std::any::TypeId::of::<F>(),
std::any::TypeId::of::<SP1Field>(),
"generate_trace_into only supports SP1Field"
);
let events = &input.ext_alu_events;
let padded_nb_rows = self.num_rows(input).unwrap();
let num_event_rows = events.len();
unsafe {
let padding_start = num_event_rows * NUM_EXT_ALU_COLS;
let padding_size = (padded_nb_rows - num_event_rows) * NUM_EXT_ALU_COLS;
if padding_size > 0 {
core::ptr::write_bytes(buffer[padding_start..].as_mut_ptr(), 0, padding_size);
}
}
let buffer_ptr = buffer.as_mut_ptr() as *mut F;
let values = unsafe {
core::slice::from_raw_parts_mut(buffer_ptr, num_event_rows * NUM_EXT_ALU_COLS)
};
let populate_len = events.len() * NUM_EXT_ALU_VALUE_COLS;
values[..populate_len].par_chunks_mut(NUM_EXT_ALU_VALUE_COLS).zip_eq(events).for_each(
|(row, &vals)| {
let cols: &mut ExtAluValueCols<_> = row.borrow_mut();
*cols = ExtAluValueCols { vals };
},
);
}
fn included(&self, _record: &Self::Record) -> bool {
true
}
}
impl<AB> Air<AB> for ExtAluChip
where
AB: SP1RecursionAirBuilder + PairBuilder,
{
fn eval(&self, builder: &mut AB) {
let main = builder.main();
let local = main.row_slice(0);
let local: &ExtAluCols<AB::Var> = (*local).borrow();
let prep = builder.preprocessed();
let prep_local = prep.row_slice(0);
let prep_local: &ExtAluPreprocessedCols<AB::Var> = (*prep_local).borrow();
for (
ExtAluValueCols { vals },
ExtAluAccessCols { addrs, is_add, is_sub, is_mul, is_div, mult },
) in zip(local.values, prep_local.accesses)
{
let in1 = vals.in1.as_extension::<AB>();
let in2 = vals.in2.as_extension::<AB>();
let out = vals.out.as_extension::<AB>();
let is_real = is_add + is_sub + is_mul + is_div;
builder.assert_bool(is_real.clone());
builder.when(is_add).assert_ext_eq(in1.clone() + in2.clone(), out.clone());
builder.when(is_sub).assert_ext_eq(in1.clone(), in2.clone() + out.clone());
builder.when(is_mul).assert_ext_eq(in1.clone() * in2.clone(), out.clone());
builder.when(is_div).assert_ext_eq(in1, in2 * out);
builder.receive_block(addrs.in1, vals.in1, is_real.clone());
builder.receive_block(addrs.in2, vals.in2, is_real);
builder.send_block(addrs.out, vals.out, mult);
}
}
}
#[cfg(test)]
mod tests {
use crate::{chips::test_fixtures, test::test_recursion_linear_program};
use rand::{rngs::StdRng, Rng, SeedableRng};
use slop_algebra::{extension::BinomialExtensionField, AbstractExtensionField};
use sp1_recursion_executor::{instruction as instr, ExtAluOpcode, MemAccessKind};
use super::*;
#[tokio::test]
async fn generate_trace() {
let shard = test_fixtures::shard().await;
let trace = ExtAluChip.generate_trace(shard, &mut ExecutionRecord::default());
assert!(trace.height() > test_fixtures::MIN_ROWS);
}
#[tokio::test]
async fn generate_preprocessed_trace() {
let program = &test_fixtures::program_with_input().await.0;
let trace = ExtAluChip.generate_preprocessed_trace(program).unwrap();
assert!(trace.height() > test_fixtures::MIN_ROWS);
}
#[tokio::test]
async fn four_ops() {
use sp1_primitives::SP1Field;
type F = SP1Field;
let mut rng = StdRng::seed_from_u64(0xDEADBEEF);
let mut random_extfelt = move || {
let inner: [F; 4] = core::array::from_fn(|_| rng.sample(rand::distributions::Standard));
BinomialExtensionField::<F, D>::from_base_slice(&inner)
};
let mut addr = 0;
let instructions = (0..1000)
.flat_map(|_| {
let quot = random_extfelt();
let in2 = random_extfelt();
let in1 = in2 * quot;
let alloc_size = 6;
let a = (0..alloc_size).map(|x| x + addr).collect::<Vec<_>>();
addr += alloc_size;
[
instr::mem_ext(MemAccessKind::Write, 4, a[0], in1),
instr::mem_ext(MemAccessKind::Write, 4, a[1], in2),
instr::ext_alu(ExtAluOpcode::AddE, 1, a[2], a[0], a[1]),
instr::mem_ext(MemAccessKind::Read, 1, a[2], in1 + in2),
instr::ext_alu(ExtAluOpcode::SubE, 1, a[3], a[0], a[1]),
instr::mem_ext(MemAccessKind::Read, 1, a[3], in1 - in2),
instr::ext_alu(ExtAluOpcode::MulE, 1, a[4], a[0], a[1]),
instr::mem_ext(MemAccessKind::Read, 1, a[4], in1 * in2),
instr::ext_alu(ExtAluOpcode::DivE, 1, a[5], a[0], a[1]),
instr::mem_ext(MemAccessKind::Read, 1, a[5], quot),
]
})
.collect::<Vec<Instruction<F>>>();
test_recursion_linear_program(instructions).await;
}
}