use lazy_static::lazy_static;
use crate::access::{AccessBuf, AccessOp};
use crate::host::VEC_MIN_SIZE;
pub use buffer::*;
pub use platform::{OpenCL, ACC_MIN_SIZE, GPU_MIN_SIZE};
mod buffer;
pub mod ops;
mod platform;
mod programs;
const TILE_SIZE: usize = 8;
const WG_SIZE: usize = 64;
lazy_static! {
pub static ref CL_PLATFORM: platform::CLPlatform = {
assert!(VEC_MIN_SIZE < GPU_MIN_SIZE);
assert!(GPU_MIN_SIZE < ACC_MIN_SIZE);
platform::CLPlatform::default().expect("OpenCL platform")
};
}
pub type ArrayBuf<T> = crate::array::Array<T, AccessBuf<ocl::Buffer<T>>, OpenCL>;
pub type ArrayOp<T, O> = crate::array::Array<T, AccessOp<O, OpenCL>, OpenCL>;
#[cfg(test)]
mod tests {
use crate::{
shape, slice, AxisRange, Error, MatrixDual, NDArray, NDArrayCompare, NDArrayMath,
NDArrayRead, NDArrayReduceBoolean, NDArrayTransform, NDArrayWrite, Shape,
};
use super::*;
#[test]
fn test_add() -> Result<(), Error> {
let shape = shape![1, 2, 3];
let left = ArrayBuf::constant(0, shape.clone())?;
let right = ArrayBuf::constant(0, shape.clone())?;
let expected = ArrayBuf::constant(0, shape.clone())?;
let actual = left.add(right)?;
let eq = actual.eq(expected)?;
assert!(eq.all()?);
Ok(())
}
#[test]
fn test_matmul_2x2() -> Result<(), Error> {
let l = ArrayOp::range(0, 4, shape![2, 2])?;
let r = ArrayOp::range(0, 4, shape![2, 2])?;
let actual = l.matmul(r)?;
assert_eq!(actual.shape(), &[2, 2]);
let expected = vec![2, 3, 6, 11];
assert_eq!(actual.buffer()?.to_slice()?.to_vec(), expected);
Ok(())
}
#[test]
fn test_matmul_12x20() -> Result<(), Error> {
let buf = OpenCL::copy_into_buffer(&(0..12).into_iter().collect::<Vec<_>>())?;
let l = ArrayBuf::new(buf, shape![3, 4])?;
let buf = OpenCL::copy_into_buffer(&(0..20).into_iter().collect::<Vec<_>>())?;
let r = ArrayBuf::new(buf, shape![4, 5])?;
let actual = l.matmul(r)?;
assert_eq!(actual.shape(), &[3, 5]);
let expected = vec![
70, 76, 82, 88, 94, 190, 212, 234, 256, 278, 310, 348, 386, 424, 462,
];
assert_eq!(actual.buffer()?.to_slice()?.to_vec(), expected);
Ok(())
}
#[test]
fn test_matmul_large() -> Result<(), Error> {
let shapes: Vec<(Shape, Shape, Shape)> = vec![
(shape![2, 3], shape![3, 4], shape![2, 4]),
(shape![9, 7], shape![7, 12], shape![9, 12]),
(shape![16, 8], shape![8, 24], shape![16, 24]),
(shape![2, 9], shape![9, 1], shape![2, 1]),
(shape![16, 8], shape![8, 32], shape![16, 32]),
(shape![2, 15, 26], shape![2, 26, 37], shape![2, 15, 37]),
(shape![3, 15, 26], shape![3, 26, 37], shape![3, 15, 37]),
(shape![8, 44, 1], shape![8, 1, 98], shape![8, 44, 98]),
];
let queue = OpenCL::queue(GPU_MIN_SIZE, &[])?;
for (left_shape, right_shape, output_shape) in shapes {
let left = ocl::Buffer::builder()
.queue(queue.clone())
.len(left_shape.iter().product::<usize>())
.fill_val(1.)
.build()?;
let right = ocl::Buffer::builder()
.queue(queue.clone())
.len(right_shape.iter().product::<usize>())
.fill_val(1.)
.build()?;
let left = ArrayBuf::new(left, left_shape)?;
let right = ArrayBuf::new(right, right_shape)?;
let expected = *left.shape().last().unwrap();
let actual = left.matmul(right)?;
assert_eq!(actual.shape(), output_shape.as_slice());
let actual = actual.buffer()?.to_slice()?;
assert!(
actual.iter().copied().all(|n| n == expected as f32),
"expected {expected} but found {actual:?}"
);
queue.flush()?;
}
Ok(())
}
#[test]
fn test_sub() -> Result<(), Error> {
let shape = shape![1, 2, 3];
let buffer = OpenCL::copy_into_buffer(&[0, 1, 2, 3, 4, 5])?;
let array = ArrayBuf::new(buffer, shape.clone())?;
let actual = array.as_ref().sub(array.as_ref())?;
assert!(!actual.any()?);
Ok(())
}
#[test]
fn test_slice() -> Result<(), Error> {
let buf = OpenCL::copy_into_buffer(&[0; 6])?;
let array = ArrayBuf::new(buf, shape![2, 3])?;
let mut slice = array.slice(slice![AxisRange::In(0, 2, 1), AxisRange::At(1)])?;
let buf = OpenCL::copy_into_buffer(&[0, 0])?;
let zeros = ArrayBuf::new(buf, shape![2])?;
let buf = OpenCL::copy_into_buffer(&[0, 0])?;
let ones = ArrayBuf::new(buf, shape![2])?;
assert!(slice.as_ref().eq(zeros)?.all()?);
slice.write(&ones)?;
Ok(())
}
}