use vyre::ir::{BufferAccess, BufferDecl, DataType, Expr, Node, Program, UnOp};
use crate::region::wrap_anonymous;
#[must_use]
pub fn swiglu(gate: &str, up: &str, output: &str, n: u32) -> Program {
let i = Expr::var("i");
let g = Expr::load(gate, i.clone());
let u = Expr::load(up, i.clone());
let sigmoid_g = Expr::div(
Expr::f32(1.0),
Expr::add(
Expr::f32(1.0),
Expr::UnOp {
op: UnOp::Exp,
operand: Box::new(Expr::UnOp {
op: UnOp::Negate,
operand: Box::new(g.clone()),
}),
},
),
);
let body = vec![
Node::let_bind("i", Expr::InvocationId { axis: 0 }),
Node::if_then(
Expr::lt(i.clone(), Expr::buf_len(output)),
vec![Node::Store {
buffer: output.into(),
index: i,
value: Expr::mul(g, Expr::mul(u, sigmoid_g)),
}],
),
];
Program::wrapped(
vec![
BufferDecl::storage(gate, 0, BufferAccess::ReadOnly, DataType::F32).with_count(n),
BufferDecl::storage(up, 1, BufferAccess::ReadOnly, DataType::F32).with_count(n),
BufferDecl::output(output, 2, DataType::F32).with_count(n),
],
[64, 1, 1],
vec![wrap_anonymous("vyre-libs::nn::swiglu", body)],
)
}
inventory::submit! {
crate::harness::OpEntry {
id: "vyre-libs::nn::swiglu",
build: || swiglu("gate", "up", "output", 4),
test_inputs: Some(|| {
let to_bytes = vyre_primitives::wire::pack_f32_slice;
vec![vec![
to_bytes(&[0.0_f32, 1.0, -1.0, 2.0]), to_bytes(&[1.0_f32, 2.0, 3.0, 4.0]), ]]
}),
expected_output: Some(|| {
let gate = [0.0_f32, 1.0, -1.0, 2.0];
let up = [1.0_f32, 2.0, 3.0, 4.0];
let out: Vec<f32> = gate.iter().zip(up.iter()).map(|(&g, &u)| {
let sigmoid_g = 1.0 / (1.0 + (-g).exp());
g * u * sigmoid_g
}).collect();
let bytes = vyre_primitives::wire::pack_f32_slice(&out);
vec![vec![bytes]]
}),
category: Some("nn"),
}
}
#[cfg(test)]
mod tests {
use super::*;
use crate::test_support::byte_pack::decode_f32;
use crate::test_support::byte_pack::f32_bytes;
use vyre_reference::value::Value;
fn swiglu_ref(g: f32, u: f32) -> f32 {
let sigmoid_g = 1.0 / (1.0 + (-g).exp());
g * u * sigmoid_g
}
#[test]
fn swiglu_all_zeros() {
let gate = [0.0f32; 4];
let up = [1.0f32; 4];
let program = swiglu("gate", "up", "output", 4);
let outputs = vyre_reference::reference_eval(
&program,
&[
Value::from(f32_bytes(&gate)),
Value::from(f32_bytes(&up)),
Value::from(vec![0u8; 16]),
],
)
.expect("Fix: swiglu all-zeros must execute");
let out = decode_f32(&outputs[0].to_bytes());
assert_eq!(out, vec![0.0; 4]);
}
#[test]
fn swiglu_varied_values() {
let gate = [1.0f32, -1.0, 0.5, -0.5];
let up = [2.0f32, 3.0, 4.0, 5.0];
let program = swiglu("gate", "up", "output", 4);
let outputs = vyre_reference::reference_eval(
&program,
&[
Value::from(f32_bytes(&gate)),
Value::from(f32_bytes(&up)),
Value::from(vec![0u8; 16]),
],
)
.expect("Fix: swiglu varied values must execute");
let out = decode_f32(&outputs[0].to_bytes());
for (i, (&v, (&g, &u))) in out.iter().zip(gate.iter().zip(up.iter())).enumerate() {
let expected = swiglu_ref(g, u);
assert!(
(v - expected).abs() <= 1.0e-5,
"swiglu mismatch at {i}: {v} != {expected}"
);
}
}
#[test]
fn swiglu_empty_tensor() {
let program = swiglu("gate", "up", "output", 0);
let outputs = vyre_reference::reference_eval(
&program,
&[
Value::from(vec![]),
Value::from(vec![]),
Value::from(vec![]),
],
)
.expect("Fix: swiglu n=0 must not panic");
assert!(outputs[0].to_bytes().is_empty());
}
#[test]
fn swiglu_nan_gate_propagates_nan() {
let gate = [f32::NAN];
let up = [1.0f32];
let program = swiglu("gate", "up", "output", 1);
let outputs = vyre_reference::reference_eval(
&program,
&[
Value::from(f32_bytes(&gate)),
Value::from(f32_bytes(&up)),
Value::from(vec![0u8; 4]),
],
)
.expect("Fix: swiglu must not panic on NaN gate");
let out = decode_f32(&outputs[0].to_bytes());
assert!(out[0].is_nan(), "swiglu(NaN gate) must be NaN");
}
}