Here is a list of all functions with links to the classes they belong to:

- g -

Gelu() : Mila::Dnn::Gelu< TDeviceType, TPrecision >
generate() : Mila::Dnn::LanguageModel< TDeviceType, TPrecision >
generateMask() : Mila::Dnn::Dropout< TDeviceType, TInput, TOutput >
generateStreaming() : Mila::Dnn::LanguageModel< TDeviceType, TPrecision >
get() : Mila::Dnn::Compute::Cuda::CublasLtPlanCache< TPlan >
get_native_type() : Mila::Dnn::VulkanTensorTraits
getActivationCudaDataType() : Mila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >
getActivationType() : Mila::Dnn::GptBlockConfig, Mila::Dnn::MLPConfig
getApproximationMethod() : Mila::Dnn::Gelu< TDeviceType, TPrecision >, Mila::Dnn::GeluConfig
getAxis() : Mila::Dnn::LayerNormConfig, Mila::Dnn::RmsNormConfig, Mila::Dnn::Softmax< TDeviceType, TPrecision >, Mila::Dnn::SoftmaxConfig
getBase() : Mila::Dnn::RopeConfig
getBeta1() : Mila::Dnn::Compute::CpuAdamWOptimizer< TPrecision >, Mila::Dnn::Compute::CudaAdamWOptimizer< TPrecision >, Mila::Dnn::Optimizers::AdamWConfig, Mila::Dnn::Optimizers::AdamWOptimizer< TDeviceType, TPrecision >
getBeta2() : Mila::Dnn::Compute::CpuAdamWOptimizer< TPrecision >, Mila::Dnn::Compute::CudaAdamWOptimizer< TPrecision >, Mila::Dnn::Optimizers::AdamWConfig, Mila::Dnn::Optimizers::AdamWOptimizer< TDeviceType, TPrecision >
getBool() : Mila::Data::SerializationMetadata, Mila::Dnn::Optimizers::SerializationMetadata, Mila::Dnn::Serialization::SerializationMetadata, Mila::Dnn::SerializationMetadata
getBosTokenId() : Mila::Data::BpeTokenizer, Mila::Data::CharTokenizer, Mila::Data::Tokenizer
getBufferString() : Mila::Dnn::Tensor< TDataType, TMemoryResource >
getByteDecoder() : Mila::Data::BpeVocabulary
getByteEncoder() : Mila::Data::BpeVocabulary
getCommandQueue() : Mila::Dnn::Compute::ExecutionContext< DeviceType::Metal >
getComponent() : Mila::Dnn::CompositeComponent< TDeviceType, TPrecision >
getComponentAs() : Mila::Dnn::CompositeComponent< TDeviceType, TPrecision >
getComponentName() : Mila::Dnn::ComponentFactory
getComponents() : Mila::Dnn::CompositeComponent< TDeviceType, TPrecision >
getComponentVersion() : Mila::Dnn::ComponentFactory
getComputeCapability() : Mila::Dnn::Compute::CudaDevice, Mila::Dnn::Compute::CudaDeviceProps
getComputeCapabilityVersion() : Mila::Dnn::Compute::CudaDevice
getComputeTypes() : Mila::Dnn::Compute::Cuda::Gqa::CudaGqaOp< TPrecision >, Mila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >, Mila::Dnn::Compute::Cuda::MultiHeadAttention::CudaMultiHeadAttentionOp< TPrecision >
getConfig() : Mila::Data::BpeTrainer, Mila::Data::BpeVocabulary, Mila::Data::CharTrainer, Mila::Data::CharVocabulary, Mila::Dnn::Compute::CpuLinearOp, Mila::Dnn::Compute::CpuSoftmaxCrossEntropyOp< TPrecision, TLogits, TTargets >, Mila::Dnn::Compute::CpuSoftmaxOp, Mila::Dnn::Compute::Cuda::Gqa::CudaGqaOp< TPrecision >, Mila::Dnn::Compute::Cuda::LayerNorm::CudaLayerNormOp< TPrecision >, Mila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >, Mila::Dnn::Compute::Cuda::MultiHeadAttention::CudaMultiHeadAttentionOp< TPrecision >, Mila::Dnn::Compute::Cuda::RmsNorm::CudaRmsNormOp< TPrecision >, Mila::Dnn::Compute::Cuda::Softmax::CudaSoftmaxOp< TPrecision >, Mila::Dnn::Compute::Cuda::SoftmaxCrossEntropy::CudaSoftmaxCrossEntropyOp< TPrecision, TLogits, TTargets >, Mila::Dnn::GptModel< TDeviceType, TPrecision >, Mila::Dnn::GroupedQueryAttention< TDeviceType, TComputePrecision, TKvPolicy >, Mila::Dnn::Linear< TDeviceType, TComputePrecision, TWeightQuant >, Mila::Dnn::LlamaModel< TDeviceType, TPrecision >, Mila::Dnn::MultiHeadAttention< TDeviceType, TPrecision >, Mila::Dnn::SoftmaxCrossEntropy< TDeviceType, TLogits, TTargets, TPrecision >
getConnectionType() : Mila::Dnn::ResidualConfig
getContextLength() : Mila::Dnn::LanguageModelConfig< TDerived >, Mila::Dnn::ModelConfig
getCorpusSize() : Mila::Data::BpeTrainer, Mila::Data::CharTrainer
getCublasLtHandle() : Mila::Dnn::Compute::ExecutionContext< DeviceType::Cuda >
getCublasLtWorkspace() : Mila::Dnn::Compute::ExecutionContext< DeviceType::Cuda >
getCublasLtWorkspaceSize() : Mila::Dnn::Compute::ExecutionContext< DeviceType::Cuda >
getCudaDataType() : Mila::Dnn::Compute::Cuda::Gqa::CudaGqaOp< TPrecision >, Mila::Dnn::Compute::Cuda::MultiHeadAttention::CudaMultiHeadAttentionOp< TPrecision >
getCurandGenerator() : Mila::Dnn::Compute::ExecutionContext< DeviceType::Cuda >
getCurrentTimestamp() : Mila::Logging::ConsoleSink, Mila::Logging::FileSink
getDataPointer() : Mila::Dnn::Compute::Cuda::TransferOps
getDatasetInfo() : Mila::Data::DataLoader< TInputDataType, TTargetDataType, TMemoryResource >
getDataType() : Mila::Dnn::Compute::Operation< TDeviceType, TComputePrecision >, Mila::Dnn::ITensor, Mila::Dnn::Tensor< TDataType, TMemoryResource >
getDataTypeName() : Mila::Dnn::ITensor, Mila::Dnn::Tensor< TDataType, TMemoryResource >
getDevice() : Mila::Dnn::Compute::DeviceRegistry, Mila::Dnn::Compute::ExecutionContext< DeviceType::Vulkan >
getDeviceCount() : Mila::Dnn::Compute::CudaDeviceRegistrar, Mila::Dnn::Compute::DeviceRegistry, Mila::Dnn::Compute::MetalDevicePlugin
getDeviceId() : Mila::Dnn::Component< TDeviceType, TPrecision >, Mila::Dnn::CompositeComponent< TDeviceType, TPrecision >, Mila::Dnn::Compute::CpuDevice, Mila::Dnn::Compute::CudaDevice, Mila::Dnn::Compute::Device, Mila::Dnn::Compute::ExecutionContext< DeviceType::Cpu >, Mila::Dnn::Compute::ExecutionContext< DeviceType::Cuda >, Mila::Dnn::Compute::ExecutionContext< DeviceType::Metal >, Mila::Dnn::Compute::ExecutionContext< DeviceType::Vulkan >, Mila::Dnn::Compute::IExecutionContext, Mila::Dnn::Compute::MetalDevice, Mila::Dnn::Compute::VulkanDevice, Mila::Dnn::FusedComponent< TDeviceType, TPrecision >, Mila::Dnn::Gelu< TDeviceType, TPrecision >, Mila::Dnn::GroupedQueryAttention< TDeviceType, TComputePrecision, TKvPolicy >, Mila::Dnn::ITensor, Mila::Dnn::LayerNorm< TDeviceType, TPrecision >, Mila::Dnn::Linear< TDeviceType, TComputePrecision, TWeightQuant >, Mila::Dnn::Lpe< TDeviceType, TIndex, TPrecision >, Mila::Dnn::Model< TDeviceType, TPrecision >, Mila::Dnn::MultiHeadAttention< TDeviceType, TPrecision >, Mila::Dnn::Network< TDeviceType, TPrecision >, Mila::Dnn::Residual< TDeviceType, TPrecision >, Mila::Dnn::RmsNorm< TDeviceType, TPrecision >, Mila::Dnn::Rope< TDeviceType, TPrecision >, Mila::Dnn::Softmax< TDeviceType, TPrecision >, Mila::Dnn::SoftmaxCrossEntropy< TDeviceType, TLogits, TTargets, TPrecision >, Mila::Dnn::Swiglu< TDeviceType, TPrecision >, Mila::Dnn::Tensor< TDataType, TMemoryResource >, Mila::Dnn::TokenEmbedding< TDeviceType, TIndex, TPrecision >
getDeviceIndex() : Mila::Dnn::Compute::MetalDevice
getDeviceInfo() : Mila::Dnn::Compute::VulkanMemoryResource
getDeviceMemorySize() : Mila::Dnn::Compute::MetalDevice, Mila::Dnn::Compute::VulkanDevice
getDeviceName() : Mila::Dnn::Compute::CpuDevice, Mila::Dnn::Compute::CudaDevice, Mila::Dnn::Compute::Device, Mila::Dnn::Compute::ExecutionContext< DeviceType::Metal >, Mila::Dnn::Compute::ExecutionContext< DeviceType::Vulkan >, Mila::Dnn::Compute::MetalDevice, Mila::Dnn::Compute::VulkanDevice
getDeviceScratchBuffer() : Mila::Dnn::Compute::ExecutionContext< DeviceType::Cuda >
getDeviceType() : Mila::Dnn::Component< TDeviceType, TPrecision >, Mila::Dnn::Compute::CpuDevice, Mila::Dnn::Compute::CudaDevice, Mila::Dnn::Compute::Device, Mila::Dnn::Compute::ExecutionContext< DeviceType::Metal >, Mila::Dnn::Compute::ExecutionContext< DeviceType::Vulkan >, Mila::Dnn::Compute::MetalDevice, Mila::Dnn::Compute::Operation< TDeviceType, TComputePrecision >, Mila::Dnn::Compute::VulkanDevice, Mila::Dnn::ITensor, Mila::Dnn::Tensor< TDataType, TMemoryResource >
getDouble() : Mila::Data::SerializationMetadata, Mila::Dnn::Optimizers::SerializationMetadata, Mila::Dnn::Serialization::SerializationMetadata, Mila::Dnn::SerializationMetadata
getDoubleVector() : Mila::Data::SerializationMetadata, Mila::Dnn::Optimizers::SerializationMetadata, Mila::Dnn::Serialization::SerializationMetadata, Mila::Dnn::SerializationMetadata
getEffectiveHiddenDimension() : Mila::Dnn::GptBlockConfig
getEmbeddingDim() : Mila::Dnn::Lpe< TDeviceType, TIndex, TPrecision >, Mila::Dnn::LpeConfig, Mila::Dnn::RopeConfig, Mila::Dnn::TokenEmbedding< TDeviceType, TIndex, TPrecision >, Mila::Dnn::TokenEmbeddingConfig
getEmbeddingSize() : Mila::Dnn::GptConfig
getEnabledTokens() : Mila::Data::SpecialTokens
getEosTokenId() : Mila::Data::BpeTokenizer, Mila::Data::CharTokenizer, Mila::Data::Tokenizer
getEpsilon() : Mila::Dnn::Compute::CpuAdamWOptimizer< TPrecision >, Mila::Dnn::Compute::CudaAdamWOptimizer< TPrecision >, Mila::Dnn::LayerNormConfig, Mila::Dnn::Optimizers::AdamWConfig, Mila::Dnn::Optimizers::AdamWOptimizer< TDeviceType, TPrecision >, Mila::Dnn::RmsNormConfig
getError() : CudaException, Mila::Dnn::Compute::CublasLtError
getExecutionContext() : Mila::Dnn::Component< TDeviceType, TPrecision >, Mila::Dnn::GptTransformer< TDeviceType, TPrecision >, Mila::Dnn::LlamaTransformer< TDeviceType, TPrecision, TWeightQuantization, TKvCachePolicy >
getFile() : Mila::Dnn::Compute::CublasLtError, Mila::Dnn::Compute::CudaError
getFilename() : Mila::Dnn::Serialization::PretrainedModelReader, Mila::Dnn::Serialization::Serializer, Mila::Dnn::Serialization::ZipSerializer
getFilepath() : Mila::Dnn::Serialization::ModelArchive
getFileSize() : Mila::Dnn::Serialization::ArchiveSerializer, Mila::Dnn::Serialization::ModelArchive, Mila::Dnn::Serialization::ZipSerializer
getFileType() : Mila::Data::MilaFileHeader
getFunction() : Mila::Dnn::Compute::CublasLtError, Mila::Dnn::Compute::CudaError
getGenerator() : Mila::Core::RandomGenerator
getGradients() : Mila::Dnn::Component< TDeviceType, TPrecision >, Mila::Dnn::CompositeComponent< TDeviceType, TPrecision >, Mila::Dnn::FusedComponent< TDeviceType, TPrecision >, Mila::Dnn::Gelu< TDeviceType, TPrecision >, Mila::Dnn::GroupedQueryAttention< TDeviceType, TComputePrecision, TKvPolicy >, Mila::Dnn::LayerNorm< TDeviceType, TPrecision >, Mila::Dnn::Linear< TDeviceType, TComputePrecision, TWeightQuant >, Mila::Dnn::Lpe< TDeviceType, TIndex, TPrecision >, Mila::Dnn::MultiHeadAttention< TDeviceType, TPrecision >, Mila::Dnn::Residual< TDeviceType, TPrecision >, Mila::Dnn::RmsNorm< TDeviceType, TPrecision >, Mila::Dnn::Rope< TDeviceType, TPrecision >, Mila::Dnn::Softmax< TDeviceType, TPrecision >, Mila::Dnn::SoftmaxCrossEntropy< TDeviceType, TLogits, TTargets, TPrecision >, Mila::Dnn::Swiglu< TDeviceType, TPrecision >, Mila::Dnn::TokenEmbedding< TDeviceType, TIndex, TPrecision >
getGroupSize() : Mila::Dnn::GqaConfig
getHeadDim() : Mila::Dnn::GqaConfig, Mila::Dnn::RopeConfig
getHiddenDimension() : Mila::Dnn::LlamaConfig
getHiddenSize() : Mila::Dnn::GptBlockConfig, Mila::Dnn::GptConfig, Mila::Dnn::MLPConfig
getIdOffset() : Mila::Data::SpecialTokens
getInfo() : Mila::Dnn::Extensibility::IModulePlugin, MyCustomLayerPlugin
getInputFeatures() : Mila::Dnn::LinearConfig, Mila::Dnn::MLPConfig
getInstance() : Mila::Core::RandomGenerator
getInt() : Mila::Data::SerializationMetadata, Mila::Dnn::Optimizers::SerializationMetadata, Mila::Dnn::Serialization::SerializationMetadata, Mila::Dnn::SerializationMetadata
getIntVector() : Mila::Data::SerializationMetadata, Mila::Dnn::Optimizers::SerializationMetadata, Mila::Dnn::Serialization::SerializationMetadata, Mila::Dnn::SerializationMetadata
getKvCacheCompression() : Mila::Dnn::LanguageModelConfig< TDerived >
getLanguageNetwork() : Mila::Dnn::LanguageModel< TDeviceType, TPrecision >
getLastGenerationStatistics() : Mila::Dnn::LanguageModel< TDeviceType, TPrecision >
getLearningRate() : Mila::Dnn::Compute::CpuAdamWOptimizer< TPrecision >, Mila::Dnn::Compute::CudaAdamWOptimizer< TPrecision >, Mila::Dnn::Compute::Optimizer< TDeviceType, TPrecision >, Mila::Dnn::ConstantLRScheduler, Mila::Dnn::CosineLRScheduler, Mila::Dnn::LearningRateScheduler, Mila::Dnn::LinearLRScheduler, Mila::Dnn::Optimizers::AdamWConfig, Mila::Dnn::Optimizers::AdamWOptimizer< TDeviceType, TPrecision >
getLevel() : Mila::Logging::ConsoleSink, Mila::Logging::FileSink, Mila::Logging::Logger, Mila::Logging::NullSink
getLine() : Mila::Dnn::Compute::CublasLtError, Mila::Dnn::Compute::CudaError
getLocationInfo() : Mila::Logging::ConsoleSink, Mila::Logging::FileSink
getMajor() : Mila::Version
getMaxMerges() : Mila::Data::BpeVocabularyConfig
getMaxSequenceLength() : Mila::Dnn::GptConfig, Mila::Dnn::LlamaConfig, Mila::Dnn::Lpe< TDeviceType, TIndex, TPrecision >, Mila::Dnn::LpeConfig, Mila::Dnn::RopeConfig
getMaxTensorSizeBytes() : Mila::Dnn::Serialization::PretrainedModelReader
getMaxThreadsPerBlock() : Mila::Dnn::Compute::CudaDevice
getMaxThreadsPerThreadgroup() : Mila::Dnn::Compute::MetalDevice
getMaxWorkGroupSize() : Mila::Dnn::Compute::VulkanDevice
getMemoryResource() : Mila::Dnn::ITensor, Mila::Dnn::Tensor< TDataType, TMemoryResource >, Mila::Dnn::TensorBuffer< TDataType, TMemoryResource, TrackMemory >
getMemoryStats() : Mila::Dnn::Component< TDeviceType, TPrecision >, Mila::Dnn::Gelu< TDeviceType, TPrecision >, Mila::Dnn::GptBlock< TDeviceType, TPrecision >, Mila::Dnn::GptTransformer< TDeviceType, TPrecision >, Mila::Dnn::GroupedQueryAttention< TDeviceType, TComputePrecision, TKvPolicy >, Mila::Dnn::LayerNorm< TDeviceType, TPrecision >, Mila::Dnn::Linear< TDeviceType, TComputePrecision, TWeightQuant >, Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy >, Mila::Dnn::LlamaTransformer< TDeviceType, TPrecision, TWeightQuantization, TKvCachePolicy >, Mila::Dnn::Lpe< TDeviceType, TIndex, TPrecision >, Mila::Dnn::MLP< TDeviceType, TPrecision >, Mila::Dnn::Model< TDeviceType, TPrecision >, Mila::Dnn::MultiHeadAttention< TDeviceType, TPrecision >, Mila::Dnn::Residual< TDeviceType, TPrecision >, Mila::Dnn::RmsNorm< TDeviceType, TPrecision >, Mila::Dnn::Rope< TDeviceType, TPrecision >, Mila::Dnn::Softmax< TDeviceType, TPrecision >, Mila::Dnn::Swiglu< TDeviceType, TPrecision >, Mila::Dnn::TokenEmbedding< TDeviceType, TIndex, TPrecision >
getMergePriority() : Mila::Data::BpeVocabulary
getMergeRules() : Mila::Data::BpeVocabulary
getMessage() : Mila::Dnn::Compute::CublasLtError, Mila::Dnn::Compute::CudaError
getMetadata() : Mila::Data::MilaFileHeader, Mila::Dnn::Serialization::ArchiveSerializer, Mila::Dnn::Serialization::ITensorBlob, Mila::Dnn::Serialization::ModelArchive, Mila::Dnn::Serialization::TensorBlob< MR >, Mila::Dnn::Serialization::ZipSerializer
getMinFrequency() : Mila::Data::BpeVocabularyConfig
getMinor() : Mila::Version
getMode() : Mila::Dnn::Serialization::ModelArchive
getModelDim() : Mila::Dnn::GptBlockConfig, Mila::Dnn::GqaConfig, Mila::Dnn::GroupedQueryAttention< TDeviceType, TComputePrecision, TKvPolicy >, Mila::Dnn::LlamaConfig, Mila::Dnn::MultiHeadAttention< TDeviceType, TPrecision >, Mila::Dnn::MultiHeadAttentionConfig
getMostFrequentPair() : Mila::Data::BpeVocabulary
getMultiprocessorCount() : Mila::Dnn::Compute::CudaDevice
getName() : Mila::Dnn::Component< TDeviceType, TPrecision >, Mila::Dnn::Compute::CpuAttentionOp, Mila::Dnn::Compute::CpuCrossEntropyOp, Mila::Dnn::Compute::CpuEncoderOp, Mila::Dnn::Compute::CpuGeluOp, Mila::Dnn::Compute::CpuLayerNormOp, Mila::Dnn::Compute::CpuLinearOp, Mila::Dnn::Compute::CpuResidualOp, Mila::Dnn::Compute::CpuSoftmaxCrossEntropyOp< TPrecision, TLogits, TTargets >, Mila::Dnn::Compute::CpuSoftmaxOp, Mila::Dnn::Compute::Cuda::Gelu::CudaGeluOp< TPrecision >, Mila::Dnn::Compute::Cuda::Gqa::CudaGqaOp< TPrecision >, Mila::Dnn::Compute::Cuda::LayerNorm::CudaLayerNormOp< TPrecision >, Mila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >, Mila::Dnn::Compute::Cuda::Lpe::CudaLpeOp< TInput, TPrecision >, Mila::Dnn::Compute::Cuda::MatMulBiasGelu::CudaMatMulBiasGeluOp< TInput, TOutput >, Mila::Dnn::Compute::Cuda::MultiHeadAttention::CudaMultiHeadAttentionOp< TPrecision >, Mila::Dnn::Compute::Cuda::Residual::CudaResidualOp< TInputA, TInputB, TPrecision >, Mila::Dnn::Compute::Cuda::RmsNorm::CudaRmsNormOp< TPrecision >, Mila::Dnn::Compute::Cuda::Rope::CudaRopeOp< TComputePrecision >, Mila::Dnn::Compute::Cuda::Softmax::CudaSoftmaxOp< TPrecision >, Mila::Dnn::Compute::Cuda::SoftmaxCrossEntropy::CudaSoftmaxCrossEntropyOp< TPrecision, TLogits, TTargets >, Mila::Dnn::Compute::Cuda::Swiglu::CudaSwigluOp< TPrecision >, Mila::Dnn::Compute::Cuda::TokenEmbedding::CudaTokenEmbeddingOp< TInput, TPrecision >, Mila::Dnn::Compute::CudaDeviceProps, Mila::Dnn::Compute::Operation< TDeviceType, TComputePrecision >, Mila::Dnn::ITensor, Mila::Dnn::Tensor< TDataType, TMemoryResource >
getNativeDevice() : Mila::Dnn::Compute::MetalDevice
getNativeHandle() : Mila::Dnn::Compute::VulkanDevice
getNextId() : Mila::Dnn::UniqueIdGenerator
getNormalizedShape() : Mila::Dnn::LayerNormConfig, Mila::Dnn::RmsNormConfig
getNumHeads() : Mila::Dnn::GptBlockConfig, Mila::Dnn::GptConfig, Mila::Dnn::GqaConfig, Mila::Dnn::GroupedQueryAttention< TDeviceType, TComputePrecision, TKvPolicy >, Mila::Dnn::LlamaConfig, Mila::Dnn::MultiHeadAttention< TDeviceType, TPrecision >, Mila::Dnn::MultiHeadAttentionConfig, Mila::Dnn::RopeConfig
getNumKVHeads() : Mila::Dnn::LlamaConfig, Mila::Dnn::RopeConfig
getNumKvHeads() : Mila::Dnn::GqaConfig, Mila::Dnn::GroupedQueryAttention< TDeviceType, TComputePrecision, TKvPolicy >
getNumLayers() : Mila::Dnn::GptConfig, Mila::Dnn::LlamaConfig
getOperationType() : Mila::Dnn::Compute::CpuAttentionOp, Mila::Dnn::Compute::CpuEncoderOp, Mila::Dnn::Compute::CpuGeluOp, Mila::Dnn::Compute::CpuLayerNormOp, Mila::Dnn::Compute::CpuLinearOp, Mila::Dnn::Compute::CpuResidualOp, Mila::Dnn::Compute::CpuSoftmaxCrossEntropyOp< TPrecision, TLogits, TTargets >, Mila::Dnn::Compute::CpuSoftmaxOp, Mila::Dnn::Compute::Cuda::Gelu::CudaGeluOp< TPrecision >, Mila::Dnn::Compute::Cuda::Gqa::CudaGqaOp< TPrecision >, Mila::Dnn::Compute::Cuda::LayerNorm::CudaLayerNormOp< TPrecision >, Mila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >, Mila::Dnn::Compute::Cuda::Lpe::CudaLpeOp< TInput, TPrecision >, Mila::Dnn::Compute::Cuda::MultiHeadAttention::CudaMultiHeadAttentionOp< TPrecision >, Mila::Dnn::Compute::Cuda::Residual::CudaResidualOp< TInputA, TInputB, TPrecision >, Mila::Dnn::Compute::Cuda::RmsNorm::CudaRmsNormOp< TPrecision >, Mila::Dnn::Compute::Cuda::Rope::CudaRopeOp< TComputePrecision >, Mila::Dnn::Compute::Cuda::Softmax::CudaSoftmaxOp< TPrecision >, Mila::Dnn::Compute::Cuda::SoftmaxCrossEntropy::CudaSoftmaxCrossEntropyOp< TPrecision, TLogits, TTargets >, Mila::Dnn::Compute::Cuda::Swiglu::CudaSwigluOp< TPrecision >, Mila::Dnn::Compute::Cuda::TokenEmbedding::CudaTokenEmbeddingOp< TInput, TPrecision >, Mila::Dnn::Compute::Operation< TDeviceType, TComputePrecision >
getOrBuildPartialAVPlan() : Mila::Dnn::Compute::Cuda::Gqa::CudaGqaOp< TPrecision >
getOrBuildPartialAVPlan_optimized() : Mila::Dnn::Compute::Cuda::Gqa::CudaGqaOp< TPrecision >
getOrBuildPartialQKPlan() : Mila::Dnn::Compute::Cuda::Gqa::CudaGqaOp< TPrecision >
getOrBuildPartialQKPlan_optimized() : Mila::Dnn::Compute::Cuda::Gqa::CudaGqaOp< TPrecision >
getOutputFeatures() : Mila::Dnn::LinearConfig
getPadTokenId() : Mila::Data::BpeTokenizer, Mila::Data::CharTokenizer, Mila::Data::Tokenizer
getParameterCount() : Mila::Dnn::Compute::CpuAdamWOptimizer< TPrecision >, Mila::Dnn::Compute::CudaAdamWOptimizer< TPrecision >, Mila::Dnn::Optimizers::AdamWOptimizer< TDeviceType, TPrecision >
getParameterNames() : Mila::Dnn::Component< TDeviceType, TPrecision >
getParameters() : Mila::Dnn::Component< TDeviceType, TPrecision >, Mila::Dnn::CompositeComponent< TDeviceType, TPrecision >, Mila::Dnn::FusedComponent< TDeviceType, TPrecision >, Mila::Dnn::Gelu< TDeviceType, TPrecision >, Mila::Dnn::GroupedQueryAttention< TDeviceType, TComputePrecision, TKvPolicy >, Mila::Dnn::LayerNorm< TDeviceType, TPrecision >, Mila::Dnn::Linear< TDeviceType, TComputePrecision, TWeightQuant >, Mila::Dnn::Lpe< TDeviceType, TIndex, TPrecision >, Mila::Dnn::MultiHeadAttention< TDeviceType, TPrecision >, Mila::Dnn::Residual< TDeviceType, TPrecision >, Mila::Dnn::RmsNorm< TDeviceType, TPrecision >, Mila::Dnn::Rope< TDeviceType, TPrecision >, Mila::Dnn::Softmax< TDeviceType, TPrecision >, Mila::Dnn::SoftmaxCrossEntropy< TDeviceType, TLogits, TTargets, TPrecision >, Mila::Dnn::Swiglu< TDeviceType, TPrecision >, Mila::Dnn::TokenEmbedding< TDeviceType, TIndex, TPrecision >
getPatch() : Mila::Version
getPinnedStagingBuffer() : Mila::Dnn::Compute::ExecutionContext< DeviceType::Cuda >
getPluginName() : Mila::Dnn::Compute::MetalDevicePlugin
getPrecision() : Mila::Dnn::Component< TDeviceType, TPrecision >, Mila::Dnn::ComponentFactory
getPrefillSize() : Mila::Dnn::BuildContext
getPreRelease() : Mila::Version
getPreTokenizationMode() : Mila::Data::BpeVocabularyConfig
getPreTokenizationPattern() : Mila::Data::BpeVocabularyConfig
getPretrainedMetadata() : Mila::Dnn::Serialization::PretrainedModelReader
getProbability() : Mila::Dnn::Dropout< TDeviceType, TInput, TOutput >, Mila::Dnn::DropoutConfig
getProperties() : Mila::Dnn::Compute::CudaDevice
getQueue() : Mila::Dnn::Compute::ExecutionContext< DeviceType::Vulkan >
getRecommendedMaxWorkingSetSize() : Mila::Dnn::Compute::MetalDevice
getRegisteredOperations() : Mila::Dnn::Compute::OperationRegistry
getRegistry() : Mila::Dnn::NetworkFactory
getResidualScale() : Mila::Dnn::GptBlockConfig
getRMSNormEpsilon() : Mila::Dnn::LlamaConfig
getRoPEScalingFactor() : Mila::Dnn::LlamaConfig
getRoPETheta() : Mila::Dnn::LlamaConfig
getRotaryDim() : Mila::Dnn::RopeConfig
getRuntimeMode() : Mila::Dnn::BuildContext, Mila::Dnn::Component< TDeviceType, TPrecision >, Mila::Dnn::Model< TDeviceType, TPrecision >
getScalingFactor() : Mila::Dnn::ResidualConfig
getSeed() : Mila::Core::RandomGenerator, Mila::Dnn::Dropout< TDeviceType, TInput, TOutput >
getShape() : Mila::Data::SerializationMetadata, Mila::Dnn::Optimizers::SerializationMetadata, Mila::Dnn::Serialization::SerializationMetadata, Mila::Dnn::SerializationMetadata
getSharedMemoryPerBlock() : Mila::Dnn::Compute::CudaDevice
getSize() : Mila::Data::BpeVocabulary, Mila::Data::CharVocabulary, Mila::Data::TokenizerVocabulary
getSpecialTokenId() : Mila::Data::BpeVocabulary
getSpecialTokenList() : Mila::Data::BpeVocabulary
getSpecialTokens() : Mila::Data::BpeVocabularyConfig, Mila::Data::CharVocabularyConfig
getStateMemorySize() : Mila::Dnn::Compute::Cuda::Gqa::CudaGqaOp< TPrecision >, Mila::Dnn::Compute::Cuda::Rope::CudaRopeOp< TComputePrecision >, Mila::Dnn::Compute::Operation< TDeviceType, TComputePrecision >
getStepCount() : Mila::Dnn::Compute::CpuAdamWOptimizer< TPrecision >, Mila::Dnn::Compute::CudaAdamWOptimizer< TPrecision >, Mila::Dnn::Optimizers::AdamWOptimizer< TDeviceType, TPrecision >
getStorageSize() : Mila::Dnn::ITensor, Mila::Dnn::Tensor< TDataType, TMemoryResource >
getStream() : Mila::Dnn::Compute::ExecutionContext< DeviceType::Cuda >
getString() : Mila::Data::SerializationMetadata, Mila::Data::SpecialTokens, Mila::Dnn::Optimizers::SerializationMetadata, Mila::Dnn::Serialization::SerializationMetadata, Mila::Dnn::SerializationMetadata
getStringVector() : Mila::Data::SerializationMetadata, Mila::Dnn::Optimizers::SerializationMetadata, Mila::Dnn::Serialization::SerializationMetadata, Mila::Dnn::SerializationMetadata
getSymbol() : Mila::Dnn::Extensibility::PluginManager
getTensorBlobMetadata() : Mila::Dnn::Serialization::PretrainedModelReader
getTensorNames() : Mila::Dnn::Serialization::PretrainedModelReader
getTensorSizeBytes() : Mila::Dnn::Serialization::PretrainedModelReader
getTotalGlobalMemory() : Mila::Dnn::Compute::CudaDevice
getTrainingMode() : Mila::Dnn::Component< TDeviceType, TPrecision >
getType() : Mila::Dnn::Component< TDeviceType, TPrecision >, Mila::Dnn::Dropout< TDeviceType, TInput, TOutput >, Mila::Dnn::Gelu< TDeviceType, TPrecision >, Mila::Dnn::GptBlock< TDeviceType, TPrecision >, Mila::Dnn::GptTransformer< TDeviceType, TPrecision >, Mila::Dnn::GroupedQueryAttention< TDeviceType, TComputePrecision, TKvPolicy >, Mila::Dnn::LayerNorm< TDeviceType, TPrecision >, Mila::Dnn::Linear< TDeviceType, TComputePrecision, TWeightQuant >, Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy >, Mila::Dnn::LlamaTransformer< TDeviceType, TPrecision, TWeightQuantization, TKvCachePolicy >, Mila::Dnn::Lpe< TDeviceType, TIndex, TPrecision >, Mila::Dnn::MLP< TDeviceType, TPrecision >, Mila::Dnn::MultiHeadAttention< TDeviceType, TPrecision >, Mila::Dnn::Network< TDeviceType, TPrecision >, Mila::Dnn::Residual< TDeviceType, TPrecision >, Mila::Dnn::RmsNorm< TDeviceType, TPrecision >, Mila::Dnn::Rope< TDeviceType, TPrecision >, Mila::Dnn::Softmax< TDeviceType, TPrecision >, Mila::Dnn::Swiglu< TDeviceType, TPrecision >, Mila::Dnn::TokenEmbedding< TDeviceType, TIndex, TPrecision >
getUId() : Mila::Dnn::ITensor, Mila::Dnn::Tensor< TDataType, TMemoryResource >
getUnderlying() : Mila::Dnn::Compute::TrackedMemoryResource
getUseBias() : Mila::Dnn::GptConfig
getValue() : Mila::Data::SerializationMetadata, Mila::Dnn::Optimizers::SerializationMetadata, Mila::Dnn::Serialization::SerializationMetadata, Mila::Dnn::SerializationMetadata
getVocab() : Mila::Data::BpeTokenizer
getVocabSize() : Mila::Data::BpeTokenizer, Mila::Data::BpeVocabularyConfig, Mila::Data::CharTokenizer, Mila::Data::Tokenizer, Mila::Dnn::CrossEntropyConfig, Mila::Dnn::GptConfig, Mila::Dnn::LlamaConfig, Mila::Dnn::SoftmaxCrossEntropy< TDeviceType, TLogits, TTargets, TPrecision >, Mila::Dnn::TokenEmbedding< TDeviceType, TIndex, TPrecision >, Mila::Dnn::TokenEmbeddingConfig
getVocabularyLength() : Mila::Dnn::Lpe< TDeviceType, TIndex, TPrecision >, Mila::Dnn::LpeConfig
getWarpSize() : Mila::Dnn::Compute::CudaDevice
getWeightCudaDataType() : Mila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >
getWeightDecay() : Mila::Dnn::Compute::CpuAdamWOptimizer< TPrecision >, Mila::Dnn::Compute::CudaAdamWOptimizer< TPrecision >, Mila::Dnn::Optimizers::AdamWConfig, Mila::Dnn::Optimizers::AdamWOptimizer< TDeviceType, TPrecision >
getWeightQuantization() : Mila::Dnn::LanguageModelConfig< TDerived >
getWpeGrad() : Mila::Dnn::Lpe< TDeviceType, TIndex, TPrecision >
getWteGrad() : Mila::Dnn::Lpe< TDeviceType, TIndex, TPrecision >, Mila::Dnn::TokenEmbedding< TDeviceType, TIndex, TPrecision >
GptBlock() : Mila::Dnn::GptBlock< TDeviceType, TPrecision >
GptBlockConfig() : Mila::Dnn::GptBlockConfig
GptConfig() : Mila::Dnn::GptConfig
GptModel() : Mila::Dnn::GptModel< TDeviceType, TPrecision >
gptStyle() : Mila::Data::SpecialTokens
GptTransformer() : Mila::Dnn::GptTransformer< TDeviceType, TPrecision >
GqaConfig() : Mila::Dnn::GqaConfig
GroupedQueryAttention() : Mila::Dnn::GroupedQueryAttention< TDeviceType, TComputePrecision, TKvPolicy >