Mila 0.13.48
Deep Neural Network Library
Loading...
Searching...
No Matches
Mila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant > Member List

This is the complete list of members for Mila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >, including all inherited members.

backward(const TensorType &input, const TensorType &output_grad, TensorType &input_grad) constMila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >inline
backward_input_plan_cache_Mila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >private
backward_weight_plan_Mila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >private
bias_Mila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >private
bias_grad_Mila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >private
build(const BuildContext &build_context) overrideMila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >inlinevirtual
buildCublasLtPlans()Mila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >inlineprivate
cached_cublaslt_handle_Mila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >private
cached_in_features_Mila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >private
cached_outer_size_Mila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >private
clearGradients() noexceptMila::Dnn::Compute::Operation< DeviceType::Cuda, TComputePrecision >inlinevirtual
compute_type_Mila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >private
ComputeType typedefMila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >
config_Mila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >private
context_Mila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >private
cuda_data_type_Mila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >private
cuda_weight_data_type_Mila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >private
CudaExecutionContext typedefMila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >
CudaLinearOp(IExecutionContext *context, const LinearConfig &config)Mila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >inline
data_typeMila::Dnn::Compute::Operation< DeviceType::Cuda, TComputePrecision >static
DataTypeTraits typedefMila::Dnn::Compute::Operation< DeviceType::Cuda, TComputePrecision >
device_typeMila::Dnn::Compute::Operation< DeviceType::Cuda, TComputePrecision >static
forward(const TensorType &input, TensorType &output) constMila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >inline
forward_plan_cache_Mila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >private
getActivationCudaDataType() constMila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >inlineprivate
getComputeTypes(cublasComputeType_t &compute_type, cudaDataType_t &scale_type) constMila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >inlineprivate
getConfig() constMila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >inline
getDataType() constMila::Dnn::Compute::Operation< DeviceType::Cuda, TComputePrecision >inlinevirtual
getDeviceType() constMila::Dnn::Compute::Operation< DeviceType::Cuda, TComputePrecision >inlinevirtual
getName() const overrideMila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >inlinevirtual
getOperationType() const overrideMila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >inlinevirtual
getStateMemorySize() constMila::Dnn::Compute::Operation< DeviceType::Cuda, TComputePrecision >inlinevirtual
getWeightCudaDataType() constMila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >inlineprivate
is_built_Mila::Dnn::Compute::Operation< DeviceType::Cuda, TComputePrecision >protected
isBuilt() constMila::Dnn::Compute::Operation< DeviceType::Cuda, TComputePrecision >inlinevirtual
isEvalMode() constMila::Dnn::Compute::Operation< DeviceType::Cuda, TComputePrecision >inlinevirtual
kIsPerChannelQuantizedMila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >static
kIsPerGroupQuantizedMila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >static
kIsQuantizedMila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >static
kUseW8A16GemmMila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >static
kWeightDtypeMila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >static
MR typedefMila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >
out_features_Mila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >private
quantize(const ITensorBlob &blob, ITensor &weight_out, ITensor &scales_out, const shape_t &expected_shape)Mila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >inline
scale_type_Mila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >private
setGradients(ITensor *weight_grad, ITensor *bias_grad) overrideMila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >inlinevirtual
setParameters(ITensor *weight, ITensor *bias) overrideMila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >inlinevirtual
setTrainingMode(TrainingMode training_mode)Mila::Dnn::Compute::Operation< DeviceType::Cuda, TComputePrecision >inlinevirtual
setWeightScales(ITensor *scales)Mila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >inline
setWeightZeroPoints(ITensor *zero_points)Mila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >inline
supportsCuBLASLt() constMila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >inlineprivate
TensorType typedefMila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >
training_mode_Mila::Dnn::Compute::Operation< DeviceType::Cuda, TComputePrecision >protected
use_cublaslt_Mila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >private
use_wmma_fp4_gemm_Mila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >private
weight_Mila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >private
weight_grad_Mila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >private
weight_group_size_Mila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >private
weight_in_features_Mila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >private
weight_out_features_Mila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >private
weight_scales_Mila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >private
weight_zero_points_Mila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >private
WeightType typedefMila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >
~CudaLinearOp()=defaultMila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >
~Operation()=defaultMila::Dnn::Compute::Operation< DeviceType::Cuda, TComputePrecision >virtual