Here is a list of all class members with links to the classes they belong to:
- a -
- acquire() : Mila::Dnn::Compute::Cuda::Rope::RopeCacheRegistry
- activation : Mila::Dnn::Serialization::PretrainedMetadata
- activation_ : Mila::Dnn::MLP< TDeviceType, TPrecision >
- activation_backward_ : Mila::Dnn::MLP< TDeviceType, TPrecision >
- activation_forward_ : Mila::Dnn::MLP< TDeviceType, TPrecision >
- activation_type_ : Mila::Dnn::GptBlockConfig, Mila::Dnn::MLPConfig
- ActivationBackwardFn : Mila::Dnn::MLP< TDeviceType, TPrecision >
- ActivationBase : Mila::Dnn::MLP< TDeviceType, TPrecision >
- activationChildName() : Mila::Dnn::MLP< TDeviceType, TPrecision >
- ActivationComponentBase : Mila::Dnn::Detail::mlp_activation_impl< ActivationType::Gelu, TDeviceType, TPrecision >, Mila::Dnn::Detail::mlp_activation_impl< ActivationType::Swiglu, TDeviceType, TPrecision >
- ActivationComponentType : Mila::Dnn::Detail::mlp_activation_impl< ActivationType::Gelu, TDeviceType, TPrecision >, Mila::Dnn::Detail::mlp_activation_impl< ActivationType::Swiglu, TDeviceType, TPrecision >
- ActivationForwardFn : Mila::Dnn::MLP< TDeviceType, TPrecision >
- ActivationType : Mila::Dnn::Compute::Cuda::CublasLtLinearPlan< TComputePrecision, TParameterPrecision >
- active_ : Mila::Dnn::Serialization::ModelArchive::ScopedScope
- active_max_seq_len_ : Mila::Dnn::Compute::Cuda::Gqa::CudaGqaOp< TPrecision >, Mila::Dnn::Compute::Cuda::MultiHeadAttention::CudaMultiHeadAttentionOp< TPrecision >
- AdamWOptimizer() : Mila::Dnn::Optimizers::AdamWOptimizer< TDeviceType, TPrecision >
- add() : Mila::Dnn::Compute::Cpu::MathOps, Mila::Dnn::Compute::Cuda::MathOps
- addActivation() : Mila::Dnn::MLP< TDeviceType, TPrecision >
- addComponent() : Mila::Dnn::CompositeComponent< TDeviceType, TPrecision >
- addCorpus() : Mila::Data::TokenizerTrainer
- addCorpusFromFile() : Mila::Data::BpeTrainer, Mila::Data::CharTrainer, Mila::Data::TokenizerTrainer
- addCorpusFromStream() : Mila::Data::BpeTrainer, Mila::Data::CharTrainer, Mila::Data::TokenizerTrainer
- addData() : Mila::Dnn::Serialization::ArchiveSerializer, Mila::Dnn::Serialization::ZipSerializer
- addImpl() : Mila::Dnn::Compute::Cuda::MathOps
- addLinear() : Mila::Dnn::MLP< TDeviceType, TPrecision >
- addMetadata() : Mila::Dnn::Serialization::ArchiveSerializer, Mila::Dnn::Serialization::ModelArchive, Mila::Dnn::Serialization::ZipSerializer
- addParameter() : Mila::Dnn::Compute::CpuAdamWOptimizer< TPrecision >, Mila::Dnn::Compute::CudaAdamWOptimizer< TPrecision >, Mila::Dnn::Compute::Optimizer< TDeviceType, TPrecision >, Mila::Dnn::Optimizers::AdamWOptimizer< TDeviceType, TPrecision >
- addRegularTokens() : Mila::Data::CharVocabulary
- addSpecialToken() : Mila::Data::BpeVocabulary
- addSpecialTokensFromConfig() : Mila::Data::BpeVocabulary, Mila::Data::CharVocabulary
- algorithm : Mila::Dnn::Compute::Cuda::CublasLtLinearPlan< TComputePrecision, TParameterPrecision >, Mila::Dnn::Compute::Cuda::CublasLtMatMulPlan< TComputePrecision >
- aligned_size_ : Mila::Dnn::TensorBuffer< TDataType, TMemoryResource, TrackMemory >
- alignedSize() : Mila::Dnn::TensorBuffer< TDataType, TMemoryResource, TrackMemory >
- alignment : Mila::Dnn::TensorBuffer< TDataType, TMemoryResource, TrackMemory >, Mila::Dnn::TensorDataTypeTraits< TensorDataType::BF16 >, Mila::Dnn::TensorDataTypeTraits< TensorDataType::FP16 >, Mila::Dnn::TensorDataTypeTraits< TensorDataType::FP32 >, Mila::Dnn::TensorDataTypeTraits< TensorDataType::FP4_E2M1 >, Mila::Dnn::TensorDataTypeTraits< TensorDataType::FP4_E3M0 >, Mila::Dnn::TensorDataTypeTraits< TensorDataType::FP8_E4M3 >, Mila::Dnn::TensorDataTypeTraits< TensorDataType::FP8_E5M2 >, Mila::Dnn::TensorDataTypeTraits< TensorDataType::INT16 >, Mila::Dnn::TensorDataTypeTraits< TensorDataType::INT32 >, Mila::Dnn::TensorDataTypeTraits< TensorDataType::INT8 >, Mila::Dnn::TensorDataTypeTraits< TensorDataType::UINT16 >, Mila::Dnn::TensorDataTypeTraits< TensorDataType::UINT32 >, Mila::Dnn::TensorDataTypeTraits< TensorDataType::UINT8 >
- allocateBuffer() : Mila::Dnn::Tensor< TDataType, TMemoryResource >
- allocateBuffers() : Mila::Data::TokenSequenceLoader< TMemoryResource >
- allocateParameters() : Mila::Dnn::RmsNorm< TDeviceType, TPrecision >
- allocateStateTensors() : Mila::Dnn::Compute::CpuAttentionOp, Mila::Dnn::Compute::Cuda::MultiHeadAttention::CudaMultiHeadAttentionOp< TPrecision >
- allocateStatisticsTensors() : Mila::Dnn::Compute::CpuLayerNormOp
- allocationCount : Mila::Dnn::Compute::MemoryStats
- AllocationStrategy : Mila::Dnn::Compute::VulkanMemoryResource
- applyMergeAndUpdateCounts() : Mila::Data::BpeVocabulary
- applySoftmax() : Mila::Dnn::Compute::CpuAttentionOp
- approximation_method_ : Mila::Dnn::GeluConfig
- architecture : Mila::Dnn::Serialization::PretrainedMetadata
- archive_ : Mila::Dnn::Serialization::ModelArchive::ScopedScope
- asInputA() : Mila::Dnn::Compute::PairedOperation< TDeviceType, TPrecision, TInputA, TInputB >
- asInputB() : Mila::Dnn::Compute::PairedOperation< TDeviceType, TPrecision, TInputA, TInputB >
- asInputTensor() : Mila::Dnn::Compute::UnaryOperation< TDeviceType, TInput, TPrecision >
- asLeftTensor() : Mila::Dnn::Compute::BinaryOperation< TDeviceType, TPrecision, TInputA, TInputB >
- asOutputTensor() : Mila::Dnn::Compute::BinaryOperation< TDeviceType, TPrecision, TInputA, TInputB >, Mila::Dnn::Compute::PairedOperation< TDeviceType, TPrecision, TInputA, TInputB >, Mila::Dnn::Compute::UnaryOperation< TDeviceType, TInput, TPrecision >
- asRightTensor() : Mila::Dnn::Compute::BinaryOperation< TDeviceType, TPrecision, TInputA, TInputB >
- att : Mila::Dnn::Compute::GqaState
- att_ : Mila::Dnn::Compute::CpuAttentionOp, Mila::Dnn::Compute::Cuda::Gqa::CudaGqaOp< TPrecision >, Mila::Dnn::Compute::Cuda::MultiHeadAttention::CudaMultiHeadAttentionOp< TPrecision >
- att_decode : Mila::Dnn::Compute::GqaState
- att_decode_ : Mila::Dnn::Compute::Cuda::Gqa::CudaGqaOp< TPrecision >, Mila::Dnn::Compute::Cuda::MultiHeadAttention::CudaMultiHeadAttentionOp< TPrecision >
- att_decode_opt_ : Mila::Dnn::Compute::Cuda::Gqa::CudaGqaOp< TPrecision >
- att_decode_tensor_ : Mila::Dnn::Compute::Cuda::Gqa::CudaGqaOp< TPrecision >, Mila::Dnn::Compute::Cuda::MultiHeadAttention::CudaMultiHeadAttentionOp< TPrecision >
- att_opt_ : Mila::Dnn::Compute::Cuda::Gqa::CudaGqaOp< TPrecision >
- att_tensor_ : Mila::Dnn::Compute::CpuAttentionOp, Mila::Dnn::Compute::Cuda::Gqa::CudaGqaOp< TPrecision >, Mila::Dnn::Compute::Cuda::MultiHeadAttention::CudaMultiHeadAttentionOp< TPrecision >
- att_tensor_optimized_ : Mila::Dnn::Compute::Cuda::Gqa::CudaGqaOp< TPrecision >
- att_value_decode_plan_ : Mila::Dnn::Compute::Cuda::Gqa::CudaGqaOp< TPrecision >, Mila::Dnn::Compute::Cuda::MultiHeadAttention::CudaMultiHeadAttentionOp< TPrecision >
- att_value_decode_plan_optimized_ : Mila::Dnn::Compute::Cuda::Gqa::CudaGqaOp< TPrecision >
- att_value_partial_prefill_plan_cache_ : Mila::Dnn::Compute::Cuda::Gqa::CudaGqaOp< TPrecision >
- att_value_partial_prefill_plan_cache_optimized_ : Mila::Dnn::Compute::Cuda::Gqa::CudaGqaOp< TPrecision >
- att_value_plan_ : Mila::Dnn::Compute::Cuda::Gqa::CudaGqaOp< TPrecision >, Mila::Dnn::Compute::Cuda::MultiHeadAttention::CudaMultiHeadAttentionOp< TPrecision >
- att_value_prefill_plan_ : Mila::Dnn::Compute::Cuda::Gqa::CudaGqaOp< TPrecision >
- att_value_prefill_plan_optimized_ : Mila::Dnn::Compute::Cuda::Gqa::CudaGqaOp< TPrecision >
- attention_type : Mila::Dnn::Serialization::PretrainedMetadata
- AttentionType : Mila::Dnn::GptBlock< TDeviceType, TPrecision >, Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy >
- attn_ : Mila::Dnn::GptBlock< TDeviceType, TPrecision >, Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy >
- attn_heads : Mila::Dnn::Visualization::VisualizerContext
- automatic_migration : Mila::Dnn::Compute::MemoryResourceTraits< CudaManagedMemoryResource >
- axis_ : Mila::Dnn::Compute::CpuLayerNormOp, Mila::Dnn::LayerNormConfig, Mila::Dnn::RmsNormConfig, Mila::Dnn::SoftmaxConfig
- axis_size : Mila::Dnn::AxisPartition