Here is a list of all functions with links to the classes they belong to:
- p -
- padTokenId() : Mila::Data::CharVocabulary
- parameterCount() : Mila::Dnn::Component< TDeviceType, TPrecision >, Mila::Dnn::CompositeComponent< TDeviceType, TPrecision >, Mila::Dnn::Dropout< TDeviceType, TInput, TOutput >, Mila::Dnn::FusedComponent< TDeviceType, TPrecision >, Mila::Dnn::Gelu< TDeviceType, TPrecision >, Mila::Dnn::GroupedQueryAttention< TDeviceType, TComputePrecision, TKvPolicy >, Mila::Dnn::LayerNorm< TDeviceType, TPrecision >, Mila::Dnn::Linear< TDeviceType, TComputePrecision, TWeightQuant >, Mila::Dnn::Lpe< TDeviceType, TIndex, TPrecision >, Mila::Dnn::MultiHeadAttention< TDeviceType, TPrecision >, Mila::Dnn::Residual< TDeviceType, TPrecision >, Mila::Dnn::RmsNorm< TDeviceType, TPrecision >, Mila::Dnn::Rope< TDeviceType, TPrecision >, Mila::Dnn::Softmax< TDeviceType, TPrecision >, Mila::Dnn::SoftmaxCrossEntropy< TDeviceType, TLogits, TTargets, TPrecision >, Mila::Dnn::Swiglu< TDeviceType, TPrecision >, Mila::Dnn::TokenEmbedding< TDeviceType, TIndex, TPrecision >
- parse() : Mila::Dnn::Compute::DeviceId
- parseComponentType() : Mila::Dnn::ComponentFactory
- parseLayerIndex() : Mila::Dnn::Network< TDeviceType, TPrecision >
- parseMetadataJSON() : Mila::Dnn::Serialization::PretrainedModelReader
- parseParameterPath() : Mila::Dnn::GptTransformer< TDeviceType, TPrecision >, Mila::Dnn::LlamaTransformer< TDeviceType, TPrecision, TWeightQuantization, TKvCachePolicy >
- parseTensorName() : Mila::Dnn::Network< TDeviceType, TPrecision >
- path() : Mila::Logging::FileSink
- performElementwiseOperation() : Mila::Dnn::Compute::Cpu::MathOps
- permute_backward() : Mila::Dnn::Compute::CpuAttentionOp, Mila::Dnn::Compute::Cuda::Gqa::Detail::cuda_gqa_kernels< float >, Mila::Dnn::Compute::Cuda::Gqa::Detail::cuda_gqa_kernels< nv_bfloat16 >, Mila::Dnn::Compute::Cuda::MultiHeadAttention::Detail::cuda_mha_kernels< float >, Mila::Dnn::Compute::Cuda::MultiHeadAttention::Detail::cuda_mha_kernels< half >
- permute_kv() : Mila::Dnn::Compute::Cuda::Gqa::Detail::cuda_gqa_kernels< float >
- permute_q_compact() : Mila::Dnn::Compute::Cuda::Gqa::Detail::cuda_gqa_kernels< float >, Mila::Dnn::Compute::Cuda::Gqa::Detail::cuda_gqa_kernels< nv_bfloat16 >
- permute_qkv() : Mila::Dnn::Compute::Cuda::Gqa::Detail::cuda_gqa_kernels< float >, Mila::Dnn::Compute::Cuda::Gqa::Detail::cuda_gqa_kernels< nv_bfloat16 >, Mila::Dnn::Compute::Cuda::MultiHeadAttention::Detail::cuda_mha_kernels< float >, Mila::Dnn::Compute::Cuda::MultiHeadAttention::Detail::cuda_mha_kernels< half >
- permute_qkv_decode() : Mila::Dnn::Compute::Cuda::Gqa::Detail::cuda_gqa_kernels< float >, Mila::Dnn::Compute::Cuda::Gqa::Detail::cuda_gqa_kernels< nv_bfloat16 >, Mila::Dnn::Compute::Cuda::MultiHeadAttention::Detail::cuda_mha_kernels< float >, Mila::Dnn::Compute::Cuda::MultiHeadAttention::Detail::cuda_mha_kernels< half >
- permute_qkv_padded() : Mila::Dnn::Compute::Cuda::Gqa::Detail::cuda_gqa_kernels< float >, Mila::Dnn::Compute::Cuda::Gqa::Detail::cuda_gqa_kernels< nv_bfloat16 >, Mila::Dnn::Compute::Cuda::MultiHeadAttention::Detail::cuda_mha_kernels< float >, Mila::Dnn::Compute::Cuda::MultiHeadAttention::Detail::cuda_mha_kernels< half >
- permuteQKV() : Mila::Dnn::Compute::CpuAttentionOp
- pixelPtr() : Mila::Dnn::Visualization::Framebuffer
- popScope() : Mila::Dnn::Serialization::ModelArchive
- preferred_allocation_strategy() : Mila::Dnn::VulkanTensorTraits
- prefill() : Mila::Dnn::Compute::Cuda::Gqa::CudaGqaOp< TPrecision >, Mila::Dnn::Compute::Cuda::MultiHeadAttention::CudaMultiHeadAttentionOp< TPrecision >, Mila::Dnn::Compute::Cuda::Rope::CudaRopeOp< TComputePrecision >, Mila::Dnn::Compute::IKvInference, Mila::Dnn::Compute::IPackedKvInference, Mila::Dnn::Compute::IPositionalPairedOp, Mila::Dnn::GptTransformer< TDeviceType, TPrecision >, Mila::Dnn::GroupedQueryAttention< TDeviceType, TComputePrecision, TKvPolicy >, Mila::Dnn::LanguageNetwork< TDeviceType, TPrecision >, Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy >, Mila::Dnn::LlamaTransformer< TDeviceType, TPrecision, TWeightQuantization, TKvCachePolicy >, Mila::Dnn::Rope< TDeviceType, TPrecision >
- prefill_optimized() : Mila::Dnn::Compute::Cuda::Gqa::CudaGqaOp< TPrecision >
- prefill_permute_qkv() : Mila::Dnn::Compute::Cuda::Gqa::Detail::cuda_gqa_kernels< nv_bfloat16 >
- prefill_softmax() : Mila::Dnn::Compute::Cuda::Gqa::Detail::cuda_gqa_kernels< float >, Mila::Dnn::Compute::Cuda::Gqa::Detail::cuda_gqa_kernels< nv_bfloat16 >
- prefill_unpermute_output_padded() : Mila::Dnn::Compute::Cuda::Gqa::Detail::cuda_gqa_kernels< float >, Mila::Dnn::Compute::Cuda::Gqa::Detail::cuda_gqa_kernels< nv_bfloat16 >
- prefillImpl() : Mila::Dnn::Compute::Cuda::Gqa::CudaGqaOp< TPrecision >
- prepareSequenceIndices() : Mila::Data::TokenSequenceLoader< TMemoryResource >
- preTokenize() : Mila::Data::BpeTokenizer, Mila::Data::BpeVocabulary
- preTokenizeCorpus() : Mila::Data::BpeVocabulary
- PretrainedModelReader() : Mila::Dnn::Serialization::PretrainedModelReader
- print() : Mila::Dnn::Compute::MemoryStats
- producerThreadFunc() : Mila::Data::TokenSequenceLoader< TMemoryResource >
- profilePrefill() : Mila::Dnn::LlamaModel< TDeviceType, TPrecision >
- pushScope() : Mila::Dnn::Serialization::ModelArchive