1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
// `nn` is the only submodule that stays publicly reachable under its own path.
pub mod nn;

// The submodules below are private: callers cannot name them by path.
mod arithmetic;
mod assign;
mod clip;
mod col_op;
mod diagflat;
mod fns;
mod gemm;
mod max;
mod random;
mod row_op;
mod scalar;
mod sum;
mod transpose;

// Glob re-exports: every public item of each private submodule above is surfaced
// directly from this module.
pub use arithmetic::*;
pub use assign::*;
pub use clip::*;
pub use col_op::*;
pub use diagflat::*;
pub use fns::*;
pub use gemm::*;
pub use max::*;
pub use random::*;
pub use row_op::*;
pub use scalar::*;
pub use sum::*;
pub use transpose::*;

#[cfg(feature = "opencl")]
use crate::Matrix;
#[cfg(feature = "opencl")]
use custos::cpu::CPU;

#[cfg(feature = "opencl")]
use custos::CLDevice;

/// Runs the CPU closure `f` for a binary (`lhs`, `rhs`) matrix operation requested on an
/// OpenCL device.
///
/// This is a thin, panicking wrapper around `crate::opencl::cpu_exec_lhs_rhs`: all
/// arguments are forwarded unchanged and the value it produces is returned directly.
/// How the operands reach the CPU closure and how the output becomes a matrix tied to
/// `device` is decided by that helper, not here.
///
/// Only compiled when the `opencl` feature is enabled.
///
/// # Panics
///
/// Panics if `cpu_exec_lhs_rhs` fails.
#[cfg(feature = "opencl")]
// NOTE(review): `'o` is not referenced anywhere in this signature; it is kept only so the
// generic parameter list stays exactly as callers already see it.
pub fn cl_to_cpu_lr<'a, 'o, T, F>(
    device: &'a CLDevice,
    lhs: &Matrix<T>,
    rhs: &Matrix<T>,
    f: F,
) -> Matrix<'a, T>
where
    T: Copy + Default + std::fmt::Debug,
    F: for<'b> Fn(&'b CPU, &Matrix<T>, &Matrix<T>) -> Matrix<'b, T>,
{
    use crate::opencl::cpu_exec_lhs_rhs;

    // `expect` instead of a bare `unwrap` so the panic message names the failing step.
    cpu_exec_lhs_rhs(device, lhs, rhs, f)
        .expect("cl_to_cpu_lr: `cpu_exec_lhs_rhs` failed to run the CPU operation")
}

/// Runs the CPU closure `f` for a single-operand matrix operation requested on an OpenCL
/// device.
///
/// This is a thin, panicking wrapper around `crate::opencl::cpu_exec`: `device` and `x`
/// are forwarded unchanged, `f` is forwarded by shared reference, and the value the
/// helper produces is returned directly. How `x` reaches the CPU closure and how the
/// output becomes a matrix tied to `device` is decided by that helper, not here.
///
/// Only compiled when the `opencl` feature is enabled.
///
/// # Panics
///
/// Panics if `cpu_exec` fails.
#[cfg(feature = "opencl")]
pub fn cl_to_cpu_s<'a, 'o, T, F>(device: &'o CLDevice, x: &Matrix<'a, T>, f: F) -> Matrix<'o, T>
where
    T: Copy + Default + std::fmt::Debug,
    F: for<'b> Fn(&'b CPU, &Matrix<'_, T>) -> Matrix<'b, T>,
{
    use crate::opencl::cpu_exec;

    // `expect` instead of a bare `unwrap` so the panic message names the failing step.
    cpu_exec(device, x, &f).expect("cl_to_cpu_s: `cpu_exec` failed to run the CPU operation")
}

/// Evaluates `f`, a CPU closure that maps a matrix to a single value of type `T`, for an
/// OpenCL device.
///
/// All three arguments are handed to `crate::opencl::cpu_exec_scalar` as-is, and whatever
/// that helper returns is the result of this function.
///
/// Only compiled when the `opencl` feature is enabled.
#[cfg(feature = "opencl")]
fn cl_to_cpu_scalar<T: Default + Copy, F: Fn(&CPU, &Matrix<T>) -> T>(
    device: &CLDevice,
    x: &Matrix<T>,
    f: F,
) -> T {
    // Pure delegation; the helper is addressed by its full path instead of a local `use`.
    crate::opencl::cpu_exec_scalar(device, x, f)
}