12 #include <cuda_runtime.h>
31 size_t n, cudaStream_t stream );
38 size_t n, cudaStream_t stream );
45 size_t n, cudaStream_t stream );
52 size_t n, cudaStream_t stream );
59 size_t n, cudaStream_t stream );
66 size_t n, cudaStream_t stream );
82 size_t n, cudaStream_t stream );
89 size_t n, cudaStream_t stream );
96 size_t n, cudaStream_t stream );
103 size_t n, cudaStream_t stream );
114 size_t n, cudaStream_t stream );
121 size_t n, cudaStream_t stream );
128 size_t n, cudaStream_t stream );
Definition Math.Elementwise.h:16
void launch_scalar_subtract_kernel(const T *src, T *dst, T scalar, size_t n, cudaStream_t stream)
Launch scalar subtraction: dst = src - scalar.
void launch_elementwise_less_kernel(const T *src1, const T *src2, T *dst, size_t n, cudaStream_t stream)
Launch element-wise less-than comparison: dst = (src1 < src2) ? <true value> : <false value> (the selected values are truncated in this listing).
void launch_scalar_divide_kernel(const T *src, T *dst, T scalar, size_t n, cudaStream_t stream)
Launch scalar division: dst = src / scalar.
void launch_elementwise_subtract_kernel(const T *src1, const T *src2, T *dst, size_t n, cudaStream_t stream)
Launch element-wise tensor subtraction: dst = src1 - src2.
void launch_elementwise_greater_kernel(const T *src1, const T *src2, T *dst, size_t n, cudaStream_t stream)
Launch element-wise greater-than comparison: dst = (src1 > src2) ? <true value> : <false value> (the selected values are truncated in this listing).
void launch_sqrt_kernel(const T *src, T *dst, size_t n, cudaStream_t stream)
Launch square root: dst = sqrt(src).
void launch_elementwise_multiply_kernel(const T *src1, const T *src2, T *dst, size_t n, cudaStream_t stream)
Launch element-wise tensor multiplication: dst = src1 * src2.
void launch_scalar_add_kernel(const T *src, T *dst, T scalar, size_t n, cudaStream_t stream)
Launch scalar addition: dst = src + scalar.
void launch_elementwise_divide_kernel(const T *src1, const T *src2, T *dst, size_t n, cudaStream_t stream)
Launch element-wise tensor division: dst = src1 / src2.
void launch_square_kernel(const T *src, T *dst, size_t n, cudaStream_t stream)
Launch square: dst = src * src.
void launch_elementwise_min_kernel(const T *src1, const T *src2, T *dst, size_t n, cudaStream_t stream)
Launch element-wise minimum: dst = min(src1, src2).
void launch_negate_kernel(const T *src, T *dst, size_t n, cudaStream_t stream)
Launch negation: dst = -src.
void launch_elementwise_add_kernel(const T *src1, const T *src2, T *dst, size_t n, cudaStream_t stream)
Launch element-wise tensor addition: dst = src1 + src2.
void launch_elementwise_max_kernel(const T *src1, const T *src2, T *dst, size_t n, cudaStream_t stream)
Launch element-wise maximum: dst = max(src1, src2).
void launch_abs_kernel(const T *src, T *dst, size_t n, cudaStream_t stream)
Launch absolute value: dst = abs(src).
void launch_elementwise_equal_kernel(const T *src1, const T *src2, T *dst, size_t n, cudaStream_t stream)
Launch element-wise equality comparison: dst = (src1 == src2) ? <true value> : <false value> (the selected values are truncated in this listing).
void launch_scalar_multiply_kernel(const T *src, T *dst, T scalar, size_t n, cudaStream_t stream)
Launch scalar multiplication: dst = src * scalar.