Here is a list of all functions with links to the classes they belong to:
- g -
- Gelu() : Mila::Dnn::Gelu< TDeviceType, TPrecision >
- generate() : Mila::Dnn::LanguageModel< TDeviceType, TPrecision >
- generateMask() : Mila::Dnn::Dropout< TDeviceType, TInput, TOutput >
- generateStreaming() : Mila::Dnn::LanguageModel< TDeviceType, TPrecision >
- get() : Mila::Dnn::Compute::Cuda::CublasLtPlanCache< TPlan >
- get_native_type() : Mila::Dnn::VulkanTensorTraits
- getActivationCudaDataType() : Mila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >
- getActivationType() : Mila::Dnn::GptBlockConfig, Mila::Dnn::MLPConfig
- getApproximationMethod() : Mila::Dnn::Gelu< TDeviceType, TPrecision >, Mila::Dnn::GeluConfig
- getAxis() : Mila::Dnn::LayerNormConfig, Mila::Dnn::RmsNormConfig, Mila::Dnn::Softmax< TDeviceType, TPrecision >, Mila::Dnn::SoftmaxConfig
- getBase() : Mila::Dnn::RopeConfig
- getBeta1() : Mila::Dnn::Compute::CpuAdamWOptimizer< TPrecision >, Mila::Dnn::Compute::CudaAdamWOptimizer< TPrecision >, Mila::Dnn::Optimizers::AdamWConfig, Mila::Dnn::Optimizers::AdamWOptimizer< TDeviceType, TPrecision >
- getBeta2() : Mila::Dnn::Compute::CpuAdamWOptimizer< TPrecision >, Mila::Dnn::Compute::CudaAdamWOptimizer< TPrecision >, Mila::Dnn::Optimizers::AdamWConfig, Mila::Dnn::Optimizers::AdamWOptimizer< TDeviceType, TPrecision >
- getBool() : Mila::Data::SerializationMetadata, Mila::Dnn::Optimizers::SerializationMetadata, Mila::Dnn::Serialization::SerializationMetadata, Mila::Dnn::SerializationMetadata
- getBosTokenId() : Mila::Data::BpeTokenizer, Mila::Data::CharTokenizer, Mila::Data::Tokenizer
- getBufferString() : Mila::Dnn::Tensor< TDataType, TMemoryResource >
- getByteDecoder() : Mila::Data::BpeVocabulary
- getByteEncoder() : Mila::Data::BpeVocabulary
- getCommandQueue() : Mila::Dnn::Compute::ExecutionContext< DeviceType::Metal >
- getComponent() : Mila::Dnn::CompositeComponent< TDeviceType, TPrecision >
- getComponentAs() : Mila::Dnn::CompositeComponent< TDeviceType, TPrecision >
- getComponentName() : Mila::Dnn::ComponentFactory
- getComponents() : Mila::Dnn::CompositeComponent< TDeviceType, TPrecision >
- getComponentVersion() : Mila::Dnn::ComponentFactory
- getComputeCapability() : Mila::Dnn::Compute::CudaDevice, Mila::Dnn::Compute::CudaDeviceProps
- getComputeCapabilityVersion() : Mila::Dnn::Compute::CudaDevice
- getComputeTypes() : Mila::Dnn::Compute::Cuda::Gqa::CudaGqaOp< TPrecision >, Mila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >, Mila::Dnn::Compute::Cuda::MultiHeadAttention::CudaMultiHeadAttentionOp< TPrecision >
- getConfig() : Mila::Data::BpeTrainer, Mila::Data::BpeVocabulary, Mila::Data::CharTrainer, Mila::Data::CharVocabulary, Mila::Dnn::Compute::CpuLinearOp, Mila::Dnn::Compute::CpuSoftmaxCrossEntropyOp< TPrecision, TLogits, TTargets >, Mila::Dnn::Compute::CpuSoftmaxOp, Mila::Dnn::Compute::Cuda::Gqa::CudaGqaOp< TPrecision >, Mila::Dnn::Compute::Cuda::LayerNorm::CudaLayerNormOp< TPrecision >, Mila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >, Mila::Dnn::Compute::Cuda::MultiHeadAttention::CudaMultiHeadAttentionOp< TPrecision >, Mila::Dnn::Compute::Cuda::RmsNorm::CudaRmsNormOp< TPrecision >, Mila::Dnn::Compute::Cuda::Softmax::CudaSoftmaxOp< TPrecision >, Mila::Dnn::Compute::Cuda::SoftmaxCrossEntropy::CudaSoftmaxCrossEntropyOp< TPrecision, TLogits, TTargets >, Mila::Dnn::GptModel< TDeviceType, TPrecision >, Mila::Dnn::GroupedQueryAttention< TDeviceType, TComputePrecision, TKvPolicy >, Mila::Dnn::Linear< TDeviceType, TComputePrecision, TWeightQuant >, Mila::Dnn::LlamaModel< TDeviceType, TPrecision >, Mila::Dnn::MultiHeadAttention< TDeviceType, TPrecision >, Mila::Dnn::SoftmaxCrossEntropy< TDeviceType, TLogits, TTargets, TPrecision >
- getConnectionType() : Mila::Dnn::ResidualConfig
- getContextLength() : Mila::Dnn::LanguageModelConfig< TDerived >, Mila::Dnn::ModelConfig
- getCorpusSize() : Mila::Data::BpeTrainer, Mila::Data::CharTrainer
- getCublasLtHandle() : Mila::Dnn::Compute::ExecutionContext< DeviceType::Cuda >
- getCublasLtWorkspace() : Mila::Dnn::Compute::ExecutionContext< DeviceType::Cuda >
- getCublasLtWorkspaceSize() : Mila::Dnn::Compute::ExecutionContext< DeviceType::Cuda >
- getCudaDataType() : Mila::Dnn::Compute::Cuda::Gqa::CudaGqaOp< TPrecision >, Mila::Dnn::Compute::Cuda::MultiHeadAttention::CudaMultiHeadAttentionOp< TPrecision >
- getCurandGenerator() : Mila::Dnn::Compute::ExecutionContext< DeviceType::Cuda >
- getCurrentTimestamp() : Mila::Logging::ConsoleSink, Mila::Logging::FileSink
- getDataPointer() : Mila::Dnn::Compute::Cuda::TransferOps
- getDatasetInfo() : Mila::Data::DataLoader< TInputDataType, TTargetDataType, TMemoryResource >
- getDataType() : Mila::Dnn::Compute::Operation< TDeviceType, TComputePrecision >, Mila::Dnn::ITensor, Mila::Dnn::Tensor< TDataType, TMemoryResource >
- getDataTypeName() : Mila::Dnn::ITensor, Mila::Dnn::Tensor< TDataType, TMemoryResource >
- getDevice() : Mila::Dnn::Compute::DeviceRegistry, Mila::Dnn::Compute::ExecutionContext< DeviceType::Vulkan >
- getDeviceCount() : Mila::Dnn::Compute::CudaDeviceRegistrar, Mila::Dnn::Compute::DeviceRegistry, Mila::Dnn::Compute::MetalDevicePlugin
- getDeviceId() : Mila::Dnn::Component< TDeviceType, TPrecision >, Mila::Dnn::CompositeComponent< TDeviceType, TPrecision >, Mila::Dnn::Compute::CpuDevice, Mila::Dnn::Compute::CudaDevice, Mila::Dnn::Compute::Device, Mila::Dnn::Compute::ExecutionContext< DeviceType::Cpu >, Mila::Dnn::Compute::ExecutionContext< DeviceType::Cuda >, Mila::Dnn::Compute::ExecutionContext< DeviceType::Metal >, Mila::Dnn::Compute::ExecutionContext< DeviceType::Vulkan >, Mila::Dnn::Compute::IExecutionContext, Mila::Dnn::Compute::MetalDevice, Mila::Dnn::Compute::VulkanDevice, Mila::Dnn::FusedComponent< TDeviceType, TPrecision >, Mila::Dnn::Gelu< TDeviceType, TPrecision >, Mila::Dnn::GroupedQueryAttention< TDeviceType, TComputePrecision, TKvPolicy >, Mila::Dnn::ITensor, Mila::Dnn::LayerNorm< TDeviceType, TPrecision >, Mila::Dnn::Linear< TDeviceType, TComputePrecision, TWeightQuant >, Mila::Dnn::Lpe< TDeviceType, TIndex, TPrecision >, Mila::Dnn::Model< TDeviceType, TPrecision >, Mila::Dnn::MultiHeadAttention< TDeviceType, TPrecision >, Mila::Dnn::Network< TDeviceType, TPrecision >, Mila::Dnn::Residual< TDeviceType, TPrecision >, Mila::Dnn::RmsNorm< TDeviceType, TPrecision >, Mila::Dnn::Rope< TDeviceType, TPrecision >, Mila::Dnn::Softmax< TDeviceType, TPrecision >, Mila::Dnn::SoftmaxCrossEntropy< TDeviceType, TLogits, TTargets, TPrecision >, Mila::Dnn::Swiglu< TDeviceType, TPrecision >, Mila::Dnn::Tensor< TDataType, TMemoryResource >, Mila::Dnn::TokenEmbedding< TDeviceType, TIndex, TPrecision >
- getDeviceIndex() : Mila::Dnn::Compute::MetalDevice
- getDeviceInfo() : Mila::Dnn::Compute::VulkanMemoryResource
- getDeviceMemorySize() : Mila::Dnn::Compute::MetalDevice, Mila::Dnn::Compute::VulkanDevice
- getDeviceName() : Mila::Dnn::Compute::CpuDevice, Mila::Dnn::Compute::CudaDevice, Mila::Dnn::Compute::Device, Mila::Dnn::Compute::ExecutionContext< DeviceType::Metal >, Mila::Dnn::Compute::ExecutionContext< DeviceType::Vulkan >, Mila::Dnn::Compute::MetalDevice, Mila::Dnn::Compute::VulkanDevice
- getDeviceScratchBuffer() : Mila::Dnn::Compute::ExecutionContext< DeviceType::Cuda >
- getDeviceType() : Mila::Dnn::Component< TDeviceType, TPrecision >, Mila::Dnn::Compute::CpuDevice, Mila::Dnn::Compute::CudaDevice, Mila::Dnn::Compute::Device, Mila::Dnn::Compute::ExecutionContext< DeviceType::Metal >, Mila::Dnn::Compute::ExecutionContext< DeviceType::Vulkan >, Mila::Dnn::Compute::MetalDevice, Mila::Dnn::Compute::Operation< TDeviceType, TComputePrecision >, Mila::Dnn::Compute::VulkanDevice, Mila::Dnn::ITensor, Mila::Dnn::Tensor< TDataType, TMemoryResource >
- getDouble() : Mila::Data::SerializationMetadata, Mila::Dnn::Optimizers::SerializationMetadata, Mila::Dnn::Serialization::SerializationMetadata, Mila::Dnn::SerializationMetadata
- getDoubleVector() : Mila::Data::SerializationMetadata, Mila::Dnn::Optimizers::SerializationMetadata, Mila::Dnn::Serialization::SerializationMetadata, Mila::Dnn::SerializationMetadata
- getEffectiveHiddenDimension() : Mila::Dnn::GptBlockConfig
- getEmbeddingDim() : Mila::Dnn::Lpe< TDeviceType, TIndex, TPrecision >, Mila::Dnn::LpeConfig, Mila::Dnn::RopeConfig, Mila::Dnn::TokenEmbedding< TDeviceType, TIndex, TPrecision >, Mila::Dnn::TokenEmbeddingConfig
- getEmbeddingSize() : Mila::Dnn::GptConfig
- getEnabledTokens() : Mila::Data::SpecialTokens
- getEosTokenId() : Mila::Data::BpeTokenizer, Mila::Data::CharTokenizer, Mila::Data::Tokenizer
- getEpsilon() : Mila::Dnn::Compute::CpuAdamWOptimizer< TPrecision >, Mila::Dnn::Compute::CudaAdamWOptimizer< TPrecision >, Mila::Dnn::LayerNormConfig, Mila::Dnn::Optimizers::AdamWConfig, Mila::Dnn::Optimizers::AdamWOptimizer< TDeviceType, TPrecision >, Mila::Dnn::RmsNormConfig
- getError() : CudaException, Mila::Dnn::Compute::CublasLtError
- getExecutionContext() : Mila::Dnn::Component< TDeviceType, TPrecision >, Mila::Dnn::GptTransformer< TDeviceType, TPrecision >, Mila::Dnn::LlamaTransformer< TDeviceType, TPrecision, TWeightQuantization, TKvCachePolicy >
- getFile() : Mila::Dnn::Compute::CublasLtError, Mila::Dnn::Compute::CudaError
- getFilename() : Mila::Dnn::Serialization::PretrainedModelReader, Mila::Dnn::Serialization::Serializer, Mila::Dnn::Serialization::ZipSerializer
- getFilepath() : Mila::Dnn::Serialization::ModelArchive
- getFileSize() : Mila::Dnn::Serialization::ArchiveSerializer, Mila::Dnn::Serialization::ModelArchive, Mila::Dnn::Serialization::ZipSerializer
- getFileType() : Mila::Data::MilaFileHeader
- getFunction() : Mila::Dnn::Compute::CublasLtError, Mila::Dnn::Compute::CudaError
- getGenerator() : Mila::Core::RandomGenerator
- getGradients() : Mila::Dnn::Component< TDeviceType, TPrecision >, Mila::Dnn::CompositeComponent< TDeviceType, TPrecision >, Mila::Dnn::FusedComponent< TDeviceType, TPrecision >, Mila::Dnn::Gelu< TDeviceType, TPrecision >, Mila::Dnn::GroupedQueryAttention< TDeviceType, TComputePrecision, TKvPolicy >, Mila::Dnn::LayerNorm< TDeviceType, TPrecision >, Mila::Dnn::Linear< TDeviceType, TComputePrecision, TWeightQuant >, Mila::Dnn::Lpe< TDeviceType, TIndex, TPrecision >, Mila::Dnn::MultiHeadAttention< TDeviceType, TPrecision >, Mila::Dnn::Residual< TDeviceType, TPrecision >, Mila::Dnn::RmsNorm< TDeviceType, TPrecision >, Mila::Dnn::Rope< TDeviceType, TPrecision >, Mila::Dnn::Softmax< TDeviceType, TPrecision >, Mila::Dnn::SoftmaxCrossEntropy< TDeviceType, TLogits, TTargets, TPrecision >, Mila::Dnn::Swiglu< TDeviceType, TPrecision >, Mila::Dnn::TokenEmbedding< TDeviceType, TIndex, TPrecision >
- getGroupSize() : Mila::Dnn::GqaConfig
- getHeadDim() : Mila::Dnn::GqaConfig, Mila::Dnn::RopeConfig
- getHiddenDimension() : Mila::Dnn::LlamaConfig
- getHiddenSize() : Mila::Dnn::GptBlockConfig, Mila::Dnn::GptConfig, Mila::Dnn::MLPConfig
- getIdOffset() : Mila::Data::SpecialTokens
- getInfo() : Mila::Dnn::Extensibility::IModulePlugin, MyCustomLayerPlugin
- getInputFeatures() : Mila::Dnn::LinearConfig, Mila::Dnn::MLPConfig
- getInstance() : Mila::Core::RandomGenerator
- getInt() : Mila::Data::SerializationMetadata, Mila::Dnn::Optimizers::SerializationMetadata, Mila::Dnn::Serialization::SerializationMetadata, Mila::Dnn::SerializationMetadata
- getIntVector() : Mila::Data::SerializationMetadata, Mila::Dnn::Optimizers::SerializationMetadata, Mila::Dnn::Serialization::SerializationMetadata, Mila::Dnn::SerializationMetadata
- getKvCacheCompression() : Mila::Dnn::LanguageModelConfig< TDerived >
- getLanguageNetwork() : Mila::Dnn::LanguageModel< TDeviceType, TPrecision >
- getLastGenerationStatistics() : Mila::Dnn::LanguageModel< TDeviceType, TPrecision >
- getLearningRate() : Mila::Dnn::Compute::CpuAdamWOptimizer< TPrecision >, Mila::Dnn::Compute::CudaAdamWOptimizer< TPrecision >, Mila::Dnn::Compute::Optimizer< TDeviceType, TPrecision >, Mila::Dnn::ConstantLRScheduler, Mila::Dnn::CosineLRScheduler, Mila::Dnn::LearningRateScheduler, Mila::Dnn::LinearLRScheduler, Mila::Dnn::Optimizers::AdamWConfig, Mila::Dnn::Optimizers::AdamWOptimizer< TDeviceType, TPrecision >
- getLevel() : Mila::Logging::ConsoleSink, Mila::Logging::FileSink, Mila::Logging::Logger, Mila::Logging::NullSink
- getLine() : Mila::Dnn::Compute::CublasLtError, Mila::Dnn::Compute::CudaError
- getLocationInfo() : Mila::Logging::ConsoleSink, Mila::Logging::FileSink
- getMajor() : Mila::Version
- getMaxMerges() : Mila::Data::BpeVocabularyConfig
- getMaxSequenceLength() : Mila::Dnn::GptConfig, Mila::Dnn::LlamaConfig, Mila::Dnn::Lpe< TDeviceType, TIndex, TPrecision >, Mila::Dnn::LpeConfig, Mila::Dnn::RopeConfig
- getMaxTensorSizeBytes() : Mila::Dnn::Serialization::PretrainedModelReader
- getMaxThreadsPerBlock() : Mila::Dnn::Compute::CudaDevice
- getMaxThreadsPerThreadgroup() : Mila::Dnn::Compute::MetalDevice
- getMaxWorkGroupSize() : Mila::Dnn::Compute::VulkanDevice
- getMemoryResource() : Mila::Dnn::ITensor, Mila::Dnn::Tensor< TDataType, TMemoryResource >, Mila::Dnn::TensorBuffer< TDataType, TMemoryResource, TrackMemory >
- getMemoryStats() : Mila::Dnn::Component< TDeviceType, TPrecision >, Mila::Dnn::Gelu< TDeviceType, TPrecision >, Mila::Dnn::GptBlock< TDeviceType, TPrecision >, Mila::Dnn::GptTransformer< TDeviceType, TPrecision >, Mila::Dnn::GroupedQueryAttention< TDeviceType, TComputePrecision, TKvPolicy >, Mila::Dnn::LayerNorm< TDeviceType, TPrecision >, Mila::Dnn::Linear< TDeviceType, TComputePrecision, TWeightQuant >, Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy >, Mila::Dnn::LlamaTransformer< TDeviceType, TPrecision, TWeightQuantization, TKvCachePolicy >, Mila::Dnn::Lpe< TDeviceType, TIndex, TPrecision >, Mila::Dnn::MLP< TDeviceType, TPrecision >, Mila::Dnn::Model< TDeviceType, TPrecision >, Mila::Dnn::MultiHeadAttention< TDeviceType, TPrecision >, Mila::Dnn::Residual< TDeviceType, TPrecision >, Mila::Dnn::RmsNorm< TDeviceType, TPrecision >, Mila::Dnn::Rope< TDeviceType, TPrecision >, Mila::Dnn::Softmax< TDeviceType, TPrecision >, Mila::Dnn::Swiglu< TDeviceType, TPrecision >, Mila::Dnn::TokenEmbedding< TDeviceType, TIndex, TPrecision >
- getMergePriority() : Mila::Data::BpeVocabulary
- getMergeRules() : Mila::Data::BpeVocabulary
- getMessage() : Mila::Dnn::Compute::CublasLtError, Mila::Dnn::Compute::CudaError
- getMetadata() : Mila::Data::MilaFileHeader, Mila::Dnn::Serialization::ArchiveSerializer, Mila::Dnn::Serialization::ITensorBlob, Mila::Dnn::Serialization::ModelArchive, Mila::Dnn::Serialization::TensorBlob< MR >, Mila::Dnn::Serialization::ZipSerializer
- getMinFrequency() : Mila::Data::BpeVocabularyConfig
- getMinor() : Mila::Version
- getMode() : Mila::Dnn::Serialization::ModelArchive
- getModelDim() : Mila::Dnn::GptBlockConfig, Mila::Dnn::GqaConfig, Mila::Dnn::GroupedQueryAttention< TDeviceType, TComputePrecision, TKvPolicy >, Mila::Dnn::LlamaConfig, Mila::Dnn::MultiHeadAttention< TDeviceType, TPrecision >, Mila::Dnn::MultiHeadAttentionConfig
- getMostFrequentPair() : Mila::Data::BpeVocabulary
- getMultiprocessorCount() : Mila::Dnn::Compute::CudaDevice
- getName() : Mila::Dnn::Component< TDeviceType, TPrecision >, Mila::Dnn::Compute::CpuAttentionOp, Mila::Dnn::Compute::CpuCrossEntropyOp, Mila::Dnn::Compute::CpuEncoderOp, Mila::Dnn::Compute::CpuGeluOp, Mila::Dnn::Compute::CpuLayerNormOp, Mila::Dnn::Compute::CpuLinearOp, Mila::Dnn::Compute::CpuResidualOp, Mila::Dnn::Compute::CpuSoftmaxCrossEntropyOp< TPrecision, TLogits, TTargets >, Mila::Dnn::Compute::CpuSoftmaxOp, Mila::Dnn::Compute::Cuda::Gelu::CudaGeluOp< TPrecision >, Mila::Dnn::Compute::Cuda::Gqa::CudaGqaOp< TPrecision >, Mila::Dnn::Compute::Cuda::LayerNorm::CudaLayerNormOp< TPrecision >, Mila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >, Mila::Dnn::Compute::Cuda::Lpe::CudaLpeOp< TInput, TPrecision >, Mila::Dnn::Compute::Cuda::MatMulBiasGelu::CudaMatMulBiasGeluOp< TInput, TOutput >, Mila::Dnn::Compute::Cuda::MultiHeadAttention::CudaMultiHeadAttentionOp< TPrecision >, Mila::Dnn::Compute::Cuda::Residual::CudaResidualOp< TInputA, TInputB, TPrecision >, Mila::Dnn::Compute::Cuda::RmsNorm::CudaRmsNormOp< TPrecision >, Mila::Dnn::Compute::Cuda::Rope::CudaRopeOp< TComputePrecision >, Mila::Dnn::Compute::Cuda::Softmax::CudaSoftmaxOp< TPrecision >, Mila::Dnn::Compute::Cuda::SoftmaxCrossEntropy::CudaSoftmaxCrossEntropyOp< TPrecision, TLogits, TTargets >, Mila::Dnn::Compute::Cuda::Swiglu::CudaSwigluOp< TPrecision >, Mila::Dnn::Compute::Cuda::TokenEmbedding::CudaTokenEmbeddingOp< TInput, TPrecision >, Mila::Dnn::Compute::CudaDeviceProps, Mila::Dnn::Compute::Operation< TDeviceType, TComputePrecision >, Mila::Dnn::ITensor, Mila::Dnn::Tensor< TDataType, TMemoryResource >
- getNativeDevice() : Mila::Dnn::Compute::MetalDevice
- getNativeHandle() : Mila::Dnn::Compute::VulkanDevice
- getNextId() : Mila::Dnn::UniqueIdGenerator
- getNormalizedShape() : Mila::Dnn::LayerNormConfig, Mila::Dnn::RmsNormConfig
- getNumHeads() : Mila::Dnn::GptBlockConfig, Mila::Dnn::GptConfig, Mila::Dnn::GqaConfig, Mila::Dnn::GroupedQueryAttention< TDeviceType, TComputePrecision, TKvPolicy >, Mila::Dnn::LlamaConfig, Mila::Dnn::MultiHeadAttention< TDeviceType, TPrecision >, Mila::Dnn::MultiHeadAttentionConfig, Mila::Dnn::RopeConfig
- getNumKVHeads() : Mila::Dnn::LlamaConfig, Mila::Dnn::RopeConfig
- getNumKvHeads() : Mila::Dnn::GqaConfig, Mila::Dnn::GroupedQueryAttention< TDeviceType, TComputePrecision, TKvPolicy >
- getNumLayers() : Mila::Dnn::GptConfig, Mila::Dnn::LlamaConfig
- getOperationType() : Mila::Dnn::Compute::CpuAttentionOp, Mila::Dnn::Compute::CpuEncoderOp, Mila::Dnn::Compute::CpuGeluOp, Mila::Dnn::Compute::CpuLayerNormOp, Mila::Dnn::Compute::CpuLinearOp, Mila::Dnn::Compute::CpuResidualOp, Mila::Dnn::Compute::CpuSoftmaxCrossEntropyOp< TPrecision, TLogits, TTargets >, Mila::Dnn::Compute::CpuSoftmaxOp, Mila::Dnn::Compute::Cuda::Gelu::CudaGeluOp< TPrecision >, Mila::Dnn::Compute::Cuda::Gqa::CudaGqaOp< TPrecision >, Mila::Dnn::Compute::Cuda::LayerNorm::CudaLayerNormOp< TPrecision >, Mila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >, Mila::Dnn::Compute::Cuda::Lpe::CudaLpeOp< TInput, TPrecision >, Mila::Dnn::Compute::Cuda::MultiHeadAttention::CudaMultiHeadAttentionOp< TPrecision >, Mila::Dnn::Compute::Cuda::Residual::CudaResidualOp< TInputA, TInputB, TPrecision >, Mila::Dnn::Compute::Cuda::RmsNorm::CudaRmsNormOp< TPrecision >, Mila::Dnn::Compute::Cuda::Rope::CudaRopeOp< TComputePrecision >, Mila::Dnn::Compute::Cuda::Softmax::CudaSoftmaxOp< TPrecision >, Mila::Dnn::Compute::Cuda::SoftmaxCrossEntropy::CudaSoftmaxCrossEntropyOp< TPrecision, TLogits, TTargets >, Mila::Dnn::Compute::Cuda::Swiglu::CudaSwigluOp< TPrecision >, Mila::Dnn::Compute::Cuda::TokenEmbedding::CudaTokenEmbeddingOp< TInput, TPrecision >, Mila::Dnn::Compute::Operation< TDeviceType, TComputePrecision >
- getOrBuildPartialAVPlan() : Mila::Dnn::Compute::Cuda::Gqa::CudaGqaOp< TPrecision >
- getOrBuildPartialAVPlan_optimized() : Mila::Dnn::Compute::Cuda::Gqa::CudaGqaOp< TPrecision >
- getOrBuildPartialQKPlan() : Mila::Dnn::Compute::Cuda::Gqa::CudaGqaOp< TPrecision >
- getOrBuildPartialQKPlan_optimized() : Mila::Dnn::Compute::Cuda::Gqa::CudaGqaOp< TPrecision >
- getOutputFeatures() : Mila::Dnn::LinearConfig
- getPadTokenId() : Mila::Data::BpeTokenizer, Mila::Data::CharTokenizer, Mila::Data::Tokenizer
- getParameterCount() : Mila::Dnn::Compute::CpuAdamWOptimizer< TPrecision >, Mila::Dnn::Compute::CudaAdamWOptimizer< TPrecision >, Mila::Dnn::Optimizers::AdamWOptimizer< TDeviceType, TPrecision >
- getParameterNames() : Mila::Dnn::Component< TDeviceType, TPrecision >
- getParameters() : Mila::Dnn::Component< TDeviceType, TPrecision >, Mila::Dnn::CompositeComponent< TDeviceType, TPrecision >, Mila::Dnn::FusedComponent< TDeviceType, TPrecision >, Mila::Dnn::Gelu< TDeviceType, TPrecision >, Mila::Dnn::GroupedQueryAttention< TDeviceType, TComputePrecision, TKvPolicy >, Mila::Dnn::LayerNorm< TDeviceType, TPrecision >, Mila::Dnn::Linear< TDeviceType, TComputePrecision, TWeightQuant >, Mila::Dnn::Lpe< TDeviceType, TIndex, TPrecision >, Mila::Dnn::MultiHeadAttention< TDeviceType, TPrecision >, Mila::Dnn::Residual< TDeviceType, TPrecision >, Mila::Dnn::RmsNorm< TDeviceType, TPrecision >, Mila::Dnn::Rope< TDeviceType, TPrecision >, Mila::Dnn::Softmax< TDeviceType, TPrecision >, Mila::Dnn::SoftmaxCrossEntropy< TDeviceType, TLogits, TTargets, TPrecision >, Mila::Dnn::Swiglu< TDeviceType, TPrecision >, Mila::Dnn::TokenEmbedding< TDeviceType, TIndex, TPrecision >
- getPatch() : Mila::Version
- getPinnedStagingBuffer() : Mila::Dnn::Compute::ExecutionContext< DeviceType::Cuda >
- getPluginName() : Mila::Dnn::Compute::MetalDevicePlugin
- getPrecision() : Mila::Dnn::Component< TDeviceType, TPrecision >, Mila::Dnn::ComponentFactory
- getPrefillSize() : Mila::Dnn::BuildContext
- getPreRelease() : Mila::Version
- getPreTokenizationMode() : Mila::Data::BpeVocabularyConfig
- getPreTokenizationPattern() : Mila::Data::BpeVocabularyConfig
- getPretrainedMetadata() : Mila::Dnn::Serialization::PretrainedModelReader
- getProbability() : Mila::Dnn::Dropout< TDeviceType, TInput, TOutput >, Mila::Dnn::DropoutConfig
- getProperties() : Mila::Dnn::Compute::CudaDevice
- getQueue() : Mila::Dnn::Compute::ExecutionContext< DeviceType::Vulkan >
- getRecommendedMaxWorkingSetSize() : Mila::Dnn::Compute::MetalDevice
- getRegisteredOperations() : Mila::Dnn::Compute::OperationRegistry
- getRegistry() : Mila::Dnn::NetworkFactory
- getResidualScale() : Mila::Dnn::GptBlockConfig
- getRMSNormEpsilon() : Mila::Dnn::LlamaConfig
- getRoPEScalingFactor() : Mila::Dnn::LlamaConfig
- getRoPETheta() : Mila::Dnn::LlamaConfig
- getRotaryDim() : Mila::Dnn::RopeConfig
- getRuntimeMode() : Mila::Dnn::BuildContext, Mila::Dnn::Component< TDeviceType, TPrecision >, Mila::Dnn::Model< TDeviceType, TPrecision >
- getScalingFactor() : Mila::Dnn::ResidualConfig
- getSeed() : Mila::Core::RandomGenerator, Mila::Dnn::Dropout< TDeviceType, TInput, TOutput >
- getShape() : Mila::Data::SerializationMetadata, Mila::Dnn::Optimizers::SerializationMetadata, Mila::Dnn::Serialization::SerializationMetadata, Mila::Dnn::SerializationMetadata
- getSharedMemoryPerBlock() : Mila::Dnn::Compute::CudaDevice
- getSize() : Mila::Data::BpeVocabulary, Mila::Data::CharVocabulary, Mila::Data::TokenizerVocabulary
- getSpecialTokenId() : Mila::Data::BpeVocabulary
- getSpecialTokenList() : Mila::Data::BpeVocabulary
- getSpecialTokens() : Mila::Data::BpeVocabularyConfig, Mila::Data::CharVocabularyConfig
- getStateMemorySize() : Mila::Dnn::Compute::Cuda::Gqa::CudaGqaOp< TPrecision >, Mila::Dnn::Compute::Cuda::Rope::CudaRopeOp< TComputePrecision >, Mila::Dnn::Compute::Operation< TDeviceType, TComputePrecision >
- getStepCount() : Mila::Dnn::Compute::CpuAdamWOptimizer< TPrecision >, Mila::Dnn::Compute::CudaAdamWOptimizer< TPrecision >, Mila::Dnn::Optimizers::AdamWOptimizer< TDeviceType, TPrecision >
- getStorageSize() : Mila::Dnn::ITensor, Mila::Dnn::Tensor< TDataType, TMemoryResource >
- getStream() : Mila::Dnn::Compute::ExecutionContext< DeviceType::Cuda >
- getString() : Mila::Data::SerializationMetadata, Mila::Data::SpecialTokens, Mila::Dnn::Optimizers::SerializationMetadata, Mila::Dnn::Serialization::SerializationMetadata, Mila::Dnn::SerializationMetadata
- getStringVector() : Mila::Data::SerializationMetadata, Mila::Dnn::Optimizers::SerializationMetadata, Mila::Dnn::Serialization::SerializationMetadata, Mila::Dnn::SerializationMetadata
- getSymbol() : Mila::Dnn::Extensibility::PluginManager
- getTensorBlobMetadata() : Mila::Dnn::Serialization::PretrainedModelReader
- getTensorNames() : Mila::Dnn::Serialization::PretrainedModelReader
- getTensorSizeBytes() : Mila::Dnn::Serialization::PretrainedModelReader
- getTotalGlobalMemory() : Mila::Dnn::Compute::CudaDevice
- getTrainingMode() : Mila::Dnn::Component< TDeviceType, TPrecision >
- getType() : Mila::Dnn::Component< TDeviceType, TPrecision >, Mila::Dnn::Dropout< TDeviceType, TInput, TOutput >, Mila::Dnn::Gelu< TDeviceType, TPrecision >, Mila::Dnn::GptBlock< TDeviceType, TPrecision >, Mila::Dnn::GptTransformer< TDeviceType, TPrecision >, Mila::Dnn::GroupedQueryAttention< TDeviceType, TComputePrecision, TKvPolicy >, Mila::Dnn::LayerNorm< TDeviceType, TPrecision >, Mila::Dnn::Linear< TDeviceType, TComputePrecision, TWeightQuant >, Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy >, Mila::Dnn::LlamaTransformer< TDeviceType, TPrecision, TWeightQuantization, TKvCachePolicy >, Mila::Dnn::Lpe< TDeviceType, TIndex, TPrecision >, Mila::Dnn::MLP< TDeviceType, TPrecision >, Mila::Dnn::MultiHeadAttention< TDeviceType, TPrecision >, Mila::Dnn::Network< TDeviceType, TPrecision >, Mila::Dnn::Residual< TDeviceType, TPrecision >, Mila::Dnn::RmsNorm< TDeviceType, TPrecision >, Mila::Dnn::Rope< TDeviceType, TPrecision >, Mila::Dnn::Softmax< TDeviceType, TPrecision >, Mila::Dnn::Swiglu< TDeviceType, TPrecision >, Mila::Dnn::TokenEmbedding< TDeviceType, TIndex, TPrecision >
- getUId() : Mila::Dnn::ITensor, Mila::Dnn::Tensor< TDataType, TMemoryResource >
- getUnderlying() : Mila::Dnn::Compute::TrackedMemoryResource
- getUseBias() : Mila::Dnn::GptConfig
- getValue() : Mila::Data::SerializationMetadata, Mila::Dnn::Optimizers::SerializationMetadata, Mila::Dnn::Serialization::SerializationMetadata, Mila::Dnn::SerializationMetadata
- getVocab() : Mila::Data::BpeTokenizer
- getVocabSize() : Mila::Data::BpeTokenizer, Mila::Data::BpeVocabularyConfig, Mila::Data::CharTokenizer, Mila::Data::Tokenizer, Mila::Dnn::CrossEntropyConfig, Mila::Dnn::GptConfig, Mila::Dnn::LlamaConfig, Mila::Dnn::SoftmaxCrossEntropy< TDeviceType, TLogits, TTargets, TPrecision >, Mila::Dnn::TokenEmbedding< TDeviceType, TIndex, TPrecision >, Mila::Dnn::TokenEmbeddingConfig
- getVocabularyLength() : Mila::Dnn::Lpe< TDeviceType, TIndex, TPrecision >, Mila::Dnn::LpeConfig
- getWarpSize() : Mila::Dnn::Compute::CudaDevice
- getWeightCudaDataType() : Mila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >
- getWeightDecay() : Mila::Dnn::Compute::CpuAdamWOptimizer< TPrecision >, Mila::Dnn::Compute::CudaAdamWOptimizer< TPrecision >, Mila::Dnn::Optimizers::AdamWConfig, Mila::Dnn::Optimizers::AdamWOptimizer< TDeviceType, TPrecision >
- getWeightQuantization() : Mila::Dnn::LanguageModelConfig< TDerived >
- getWpeGrad() : Mila::Dnn::Lpe< TDeviceType, TIndex, TPrecision >
- getWteGrad() : Mila::Dnn::Lpe< TDeviceType, TIndex, TPrecision >, Mila::Dnn::TokenEmbedding< TDeviceType, TIndex, TPrecision >
- GptBlock() : Mila::Dnn::GptBlock< TDeviceType, TPrecision >
- GptBlockConfig() : Mila::Dnn::GptBlockConfig
- GptConfig() : Mila::Dnn::GptConfig
- GptModel() : Mila::Dnn::GptModel< TDeviceType, TPrecision >
- gptStyle() : Mila::Data::SpecialTokens
- GptTransformer() : Mila::Dnn::GptTransformer< TDeviceType, TPrecision >
- GqaConfig() : Mila::Dnn::GqaConfig
- GroupedQueryAttention() : Mila::Dnn::GroupedQueryAttention< TDeviceType, TComputePrecision, TKvPolicy >