matmul_post

matmul_post(
    a: &Tensor<T>,
    b: &Tensor<T> | Tensor<T>,
    post_op: fn(T) -> T,
    post_op_vec: fn(T::Simd) -> T::Simd,
) -> Result<Tensor<T>, TensorError>

Same as matmul but will perform post operation before writing final result to the memory.

Parameters:

a: First input tensor.

b: Second input tensor.

post_op: post operation function that takes scalar T

post_op_vec: post operation function that takes simd vector T::Simd

Returns:

A new Tensor containing the result of matrix multiplication and post operation

Examples:

use hpt::{
    error::TensorError,
    ops::{MatmulPost, TensorCreator},
    types::math::NormalOutUnary,
    Tensor,
};

fn main() -> Result<(), TensorError> {
    // 2D matrix multiplication
    let a = Tensor::<f64>::new(&[[1., 2.], [3., 4.]]);
    let b = Tensor::<f64>::new(&[[5., 6.], [7., 8.]]);
    let c = a.matmul_post(&b, |x| x._relu(), |x| x._relu())?;
    println!("2D result:\n{}", c);

    // 3D batch matrix multiplication
    let d = Tensor::<f64>::ones(&[2, 2, 3])?; // 2 matrices of shape 2x3
    let e = Tensor::<f64>::ones(&[2, 3, 2])?; // 2 matrices of shape 3x2
    let f = d.matmul_post(&e, |x| x._relu(), |x| x._relu())?; // 2 matrices of shape 2x2
    println!("3D result:\n{}", f);

    Ok(())
}

Backend Support

Backend	Supported
CPU	✅
Cuda	❌