Here is a list of all class members with links to the classes they belong to:
- p -
- pad_token : Mila::Data::SpecialTokens
- pad_token_id_ : Mila::Data::CharVocabulary
- padTokenId() : Mila::Data::CharVocabulary
- paired_registry_ : Mila::Dnn::Compute::OperationRegistry
- param_data_ : Mila::Dnn::Compute::CpuAdamWOptimizer< TPrecision >, Mila::Dnn::Compute::CudaAdamWOptimizer< TPrecision >
- parameterCount() : Mila::Dnn::Component< TDeviceType, TPrecision >, Mila::Dnn::CompositeComponent< TDeviceType, TPrecision >, Mila::Dnn::Dropout< TDeviceType, TInput, TOutput >, Mila::Dnn::FusedComponent< TDeviceType, TPrecision >, Mila::Dnn::Gelu< TDeviceType, TPrecision >, Mila::Dnn::GroupedQueryAttention< TDeviceType, TComputePrecision, TKvPolicy >, Mila::Dnn::LayerNorm< TDeviceType, TPrecision >, Mila::Dnn::Linear< TDeviceType, TComputePrecision, TWeightQuant >, Mila::Dnn::Lpe< TDeviceType, TIndex, TPrecision >, Mila::Dnn::MultiHeadAttention< TDeviceType, TPrecision >, Mila::Dnn::Residual< TDeviceType, TPrecision >, Mila::Dnn::RmsNorm< TDeviceType, TPrecision >, Mila::Dnn::Rope< TDeviceType, TPrecision >, Mila::Dnn::Softmax< TDeviceType, TPrecision >, Mila::Dnn::SoftmaxCrossEntropy< TDeviceType, TLogits, TTargets, TPrecision >, Mila::Dnn::Swiglu< TDeviceType, TPrecision >, Mila::Dnn::TokenEmbedding< TDeviceType, TIndex, TPrecision >
- ParameterGradTensor : Mila::Dnn::Compute::BinaryOperation< TDeviceType, TPrecision, TInputA, TInputB >
- parameters_ : Mila::Dnn::Dropout< TDeviceType, TInput, TOutput >, Mila::Dnn::FusedComponent< TDeviceType, TPrecision >
- ParameterTensor : Mila::Dnn::Compute::BinaryOperation< TDeviceType, TPrecision, TInputA, TInputB >
- ParameterType : Mila::Dnn::Compute::Cuda::CublasLtLinearPlan< TComputePrecision, TParameterPrecision >
- params_ : Mila::Dnn::Compute::CpuAdamWOptimizer< TPrecision >, Mila::Dnn::Compute::CudaAdamWOptimizer< TPrecision >
- parse() : Mila::Dnn::Compute::DeviceId
- parseComponentType() : Mila::Dnn::ComponentFactory
- parseLayerIndex() : Mila::Dnn::Network< TDeviceType, TPrecision >
- parseMetadataJSON() : Mila::Dnn::Serialization::PretrainedModelReader
- parseParameterPath() : Mila::Dnn::GptTransformer< TDeviceType, TPrecision >, Mila::Dnn::LlamaTransformer< TDeviceType, TPrecision, TWeightQuantization, TKvCachePolicy >
- parseTensorName() : Mila::Dnn::Network< TDeviceType, TPrecision >
- patch_ : Mila::Version
- path : Mila::Dnn::Extensibility::PluginManager::PluginEntry, Mila::Logging::FileSink
- path_ : Mila::Logging::FileSink
- pciBusID : Mila::Dnn::Compute::CudaDeviceProps
- pciDeviceID : Mila::Dnn::Compute::CudaDeviceProps
- pciDomainID : Mila::Dnn::Compute::CudaDeviceProps
- peakUsage : Mila::Dnn::Compute::MemoryStats
- performElementwiseOperation() : Mila::Dnn::Compute::Cpu::MathOps
- permute_backward() : Mila::Dnn::Compute::CpuAttentionOp, Mila::Dnn::Compute::Cuda::Gqa::Detail::cuda_gqa_kernels< float >, Mila::Dnn::Compute::Cuda::Gqa::Detail::cuda_gqa_kernels< nv_bfloat16 >, Mila::Dnn::Compute::Cuda::MultiHeadAttention::Detail::cuda_mha_kernels< float >, Mila::Dnn::Compute::Cuda::MultiHeadAttention::Detail::cuda_mha_kernels< half >
- permute_kv() : Mila::Dnn::Compute::Cuda::Gqa::Detail::cuda_gqa_kernels< float >
- permute_q_compact() : Mila::Dnn::Compute::Cuda::Gqa::Detail::cuda_gqa_kernels< float >, Mila::Dnn::Compute::Cuda::Gqa::Detail::cuda_gqa_kernels< nv_bfloat16 >
- permute_qkv() : Mila::Dnn::Compute::Cuda::Gqa::Detail::cuda_gqa_kernels< float >, Mila::Dnn::Compute::Cuda::Gqa::Detail::cuda_gqa_kernels< nv_bfloat16 >, Mila::Dnn::Compute::Cuda::MultiHeadAttention::Detail::cuda_mha_kernels< float >, Mila::Dnn::Compute::Cuda::MultiHeadAttention::Detail::cuda_mha_kernels< half >
- permute_qkv_decode() : Mila::Dnn::Compute::Cuda::Gqa::Detail::cuda_gqa_kernels< float >, Mila::Dnn::Compute::Cuda::Gqa::Detail::cuda_gqa_kernels< nv_bfloat16 >, Mila::Dnn::Compute::Cuda::MultiHeadAttention::Detail::cuda_mha_kernels< float >, Mila::Dnn::Compute::Cuda::MultiHeadAttention::Detail::cuda_mha_kernels< half >
- permute_qkv_padded() : Mila::Dnn::Compute::Cuda::Gqa::Detail::cuda_gqa_kernels< float >, Mila::Dnn::Compute::Cuda::Gqa::Detail::cuda_gqa_kernels< nv_bfloat16 >, Mila::Dnn::Compute::Cuda::MultiHeadAttention::Detail::cuda_mha_kernels< float >, Mila::Dnn::Compute::Cuda::MultiHeadAttention::Detail::cuda_mha_kernels< half >
- permuteQKV() : Mila::Dnn::Compute::CpuAttentionOp
- pinned_staging_buf_ : Mila::Dnn::Compute::ExecutionContext< DeviceType::Cuda >
- pinned_staging_size_ : Mila::Dnn::Compute::ExecutionContext< DeviceType::Cuda >
- pixelPtr() : Mila::Dnn::Visualization::Framebuffer
- pixels : Mila::Dnn::Visualization::Framebuffer
- PlanBuilder : Mila::Dnn::Compute::Cuda::CublasLtPlanCache< TPlan >
- plugin : Mila::Dnn::Extensibility::PluginManager::PluginEntry
- PLUGIN_EXTENSION : Mila::Dnn::Extensibility::PluginManager
- plugins_ : Mila::Dnn::Extensibility::PluginManager
- popScope() : Mila::Dnn::Serialization::ModelArchive
- positional_encoding : Mila::Dnn::Serialization::PretrainedMetadata
- positional_op_ : Mila::Dnn::GroupedQueryAttention< TDeviceType, TComputePrecision, TKvPolicy >, Mila::Dnn::MultiHeadAttention< TDeviceType, TPrecision >, Mila::Dnn::Rope< TDeviceType, TPrecision >
- pre_release_tag_ : Mila::Version
- pre_tokenization_mode_ : Mila::Data::BpeVocabularyConfig
- pre_tokenization_pattern_ : Mila::Data::BpeVocabularyConfig
- pre_tokenization_regex_ : Mila::Data::BpeTokenizer
- preatt : Mila::Dnn::Compute::GqaState
- preatt_ : Mila::Dnn::Compute::CpuAttentionOp, Mila::Dnn::Compute::Cuda::Gqa::CudaGqaOp< TPrecision >, Mila::Dnn::Compute::Cuda::MultiHeadAttention::CudaMultiHeadAttentionOp< TPrecision >
- preatt_decode : Mila::Dnn::Compute::GqaState
- preatt_decode_ : Mila::Dnn::Compute::Cuda::Gqa::CudaGqaOp< TPrecision >, Mila::Dnn::Compute::Cuda::MultiHeadAttention::CudaMultiHeadAttentionOp< TPrecision >
- preatt_decode_opt_ : Mila::Dnn::Compute::Cuda::Gqa::CudaGqaOp< TPrecision >
- preatt_decode_tensor_ : Mila::Dnn::Compute::Cuda::Gqa::CudaGqaOp< TPrecision >, Mila::Dnn::Compute::Cuda::MultiHeadAttention::CudaMultiHeadAttentionOp< TPrecision >
- preatt_opt_ : Mila::Dnn::Compute::Cuda::Gqa::CudaGqaOp< TPrecision >
- preatt_tensor_ : Mila::Dnn::Compute::CpuAttentionOp, Mila::Dnn::Compute::Cuda::Gqa::CudaGqaOp< TPrecision >, Mila::Dnn::Compute::Cuda::MultiHeadAttention::CudaMultiHeadAttentionOp< TPrecision >
- preatt_tensor_optimized_ : Mila::Dnn::Compute::Cuda::Gqa::CudaGqaOp< TPrecision >
- precision : Mila::Dnn::Compute::Cuda::Rope::RopeCacheRegistry::CacheKey
- preference : Mila::Dnn::Compute::Cuda::CublasLtLinearPlan< TComputePrecision, TParameterPrecision >, Mila::Dnn::Compute::Cuda::CublasLtMatMulPlan< TComputePrecision >
- preferred_alignment : Mila::Dnn::Compute::MemoryResourceTraits< CpuMemoryResource >, Mila::Dnn::Compute::MemoryResourceTraits< CudaDeviceMemoryResource >, Mila::Dnn::Compute::MemoryResourceTraits< CudaManagedMemoryResource >, Mila::Dnn::Compute::MemoryResourceTraits< CudaPinnedMemoryResource >
- preferred_allocation_strategy() : Mila::Dnn::VulkanTensorTraits
- prefill() : Mila::Dnn::Compute::Cuda::Gqa::CudaGqaOp< TPrecision >, Mila::Dnn::Compute::Cuda::MultiHeadAttention::CudaMultiHeadAttentionOp< TPrecision >, Mila::Dnn::Compute::Cuda::Rope::CudaRopeOp< TComputePrecision >, Mila::Dnn::Compute::IKvInference, Mila::Dnn::Compute::IPackedKvInference, Mila::Dnn::Compute::IPositionalPairedOp, Mila::Dnn::GptTransformer< TDeviceType, TPrecision >, Mila::Dnn::GroupedQueryAttention< TDeviceType, TComputePrecision, TKvPolicy >, Mila::Dnn::LanguageNetwork< TDeviceType, TPrecision >, Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy >, Mila::Dnn::LlamaTransformer< TDeviceType, TPrecision, TWeightQuantization, TKvCachePolicy >, Mila::Dnn::Rope< TDeviceType, TPrecision >
- prefill_ : Mila::Dnn::LlamaTransformer< TDeviceType, TPrecision, TWeightQuantization, TKvCachePolicy >
- prefill_chunk_size_ : Mila::Dnn::Compute::Cuda::Gqa::CudaGqaOp< TPrecision >, Mila::Dnn::LlamaTransformer< TDeviceType, TPrecision, TWeightQuantization, TKvCachePolicy >
- prefill_optimized() : Mila::Dnn::Compute::Cuda::Gqa::CudaGqaOp< TPrecision >
- prefill_permute_qkv() : Mila::Dnn::Compute::Cuda::Gqa::Detail::cuda_gqa_kernels< nv_bfloat16 >
- prefill_size_ : Mila::Dnn::BuildContext
- prefill_softmax() : Mila::Dnn::Compute::Cuda::Gqa::Detail::cuda_gqa_kernels< float >, Mila::Dnn::Compute::Cuda::Gqa::Detail::cuda_gqa_kernels< nv_bfloat16 >
- prefill_time_ms : Mila::Dnn::GenerationStatistics
- prefill_unpermute_output_padded() : Mila::Dnn::Compute::Cuda::Gqa::Detail::cuda_gqa_kernels< float >, Mila::Dnn::Compute::Cuda::Gqa::Detail::cuda_gqa_kernels< nv_bfloat16 >
- prefillImpl() : Mila::Dnn::Compute::Cuda::Gqa::CudaGqaOp< TPrecision >
- prepareSequenceIndices() : Mila::Data::TokenSequenceLoader< TMemoryResource >
- preTokenize() : Mila::Data::BpeTokenizer, Mila::Data::BpeVocabulary
- preTokenizeCorpus() : Mila::Data::BpeVocabulary
- PretrainedModelReader() : Mila::Dnn::Serialization::PretrainedModelReader
- print() : Mila::Dnn::Compute::MemoryStats
- probability_ : Mila::Dnn::DropoutConfig
- producer_exception_ : Mila::Data::TokenSequenceLoader< TMemoryResource >
- producer_thread_ : Mila::Data::TokenSequenceLoader< TMemoryResource >
- producerThreadFunc() : Mila::Data::TokenSequenceLoader< TMemoryResource >
- profilePrefill() : Mila::Dnn::LlamaModel< TDeviceType, TPrecision >
- prompt_tokens : Mila::Dnn::GenerationStatistics
- props_ : Mila::Dnn::Compute::CudaDevice
- pushScope() : Mila::Dnn::Serialization::ModelArchive