Here is a list of all class members with links to the classes they belong to:
- w -
- w : Mila::Dnn::Visualization::Rect
- warning() : Mila::Logging::Logger
- warp_size : Mila::Dnn::Compute::MemoryResourceTraits< CudaDeviceMemoryResource >, Mila::Dnn::Compute::MemoryResourceTraits< CudaManagedMemoryResource >, Mila::Dnn::Compute::MemoryResourceTraits< CudaPinnedMemoryResource >
- warpSize : Mila::Dnn::Compute::CudaDeviceProps
- weight_ : Mila::Dnn::Compute::CpuLayerNormOp, Mila::Dnn::Compute::CpuLinearOp, Mila::Dnn::Compute::Cuda::LayerNorm::CudaLayerNormOp< TPrecision >, Mila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >, Mila::Dnn::Compute::Cuda::RmsNorm::CudaRmsNormOp< TPrecision >, Mila::Dnn::LayerNorm< TDeviceType, TPrecision >, Mila::Dnn::Linear< TDeviceType, TComputePrecision, TWeightQuant >, Mila::Dnn::RmsNorm< TDeviceType, TPrecision >
- weight_decay_ : Mila::Dnn::Optimizers::AdamWConfig
- weight_grad_ : Mila::Dnn::Compute::CpuLayerNormOp, Mila::Dnn::Compute::CpuLinearOp, Mila::Dnn::Compute::Cuda::LayerNorm::CudaLayerNormOp< TPrecision >, Mila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >, Mila::Dnn::Compute::Cuda::RmsNorm::CudaRmsNormOp< TPrecision >, Mila::Dnn::LayerNorm< TDeviceType, TPrecision >, Mila::Dnn::Linear< TDeviceType, TComputePrecision, TWeightQuant >, Mila::Dnn::RmsNorm< TDeviceType, TPrecision >
- weight_group_size_ : Mila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >
- weight_in_features_ : Mila::Dnn::Compute::CpuLinearOp, Mila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >
- weight_out_features_ : Mila::Dnn::Compute::CpuLinearOp, Mila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >
- weight_quantization_ : Mila::Dnn::LanguageModelConfig< TDerived >
- weight_scales_ : Mila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >, Mila::Dnn::Linear< TDeviceType, TComputePrecision, TWeightQuant >
- weight_size_ : Mila::Dnn::Compute::Cuda::LayerNorm::CudaLayerNormOp< TPrecision >
- weight_zero_points_ : Mila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >
- WeightScaleTensorType : Mila::Dnn::Linear< TDeviceType, TComputePrecision, TWeightQuant >
- WeightTensorType : Mila::Dnn::Linear< TDeviceType, TComputePrecision, TWeightQuant >
- WeightType : Mila::Dnn::Compute::Cuda::Linear::CudaLinearOp< TComputePrecision, TWeightQuant >
- what() : Mila::Dnn::Compute::CudaBadAlloc
- width : Mila::Dnn::Visualization::Framebuffer
- window_size_tokens_ : Mila::Data::TokenSequenceLoader< TMemoryResource >
- windowSizeTokens() : Mila::Data::TokenSequenceLoader< TMemoryResource >
- withActivation() : Mila::Dnn::GptBlockConfig, Mila::Dnn::MLPConfig
- withApproximationMethod() : Mila::Dnn::GeluConfig
- withAxis() : Mila::Dnn::SoftmaxConfig
- withBase() : Mila::Dnn::RopeConfig
- withBeta1() : Mila::Dnn::Optimizers::AdamWConfig
- withBeta2() : Mila::Dnn::Optimizers::AdamWConfig
- withBias() : Mila::Dnn::GptBlockConfig, Mila::Dnn::GptConfig, Mila::Dnn::LayerNormConfig, Mila::Dnn::LinearConfig, Mila::Dnn::LlamaConfig, Mila::Dnn::MLPConfig, Mila::Dnn::RmsNormConfig
- withByteLevel() : Mila::Data::BpeVocabularyConfig, Mila::Data::CharVocabularyConfig
- withCaseSensitive() : Mila::Data::CharVocabularyConfig
- withConnectionType() : Mila::Dnn::ResidualConfig
- withContextLength() : Mila::Dnn::LanguageModelConfig< TDerived >, Mila::Dnn::ModelConfig
- withEmbeddingDim() : Mila::Dnn::LpeConfig, Mila::Dnn::TokenEmbeddingConfig
- withEpsilon() : Mila::Dnn::LayerNormConfig, Mila::Dnn::Optimizers::AdamWConfig, Mila::Dnn::RmsNormConfig
- withFP4Quantization() : Mila::Dnn::LanguageModelConfig< TDerived >
- withFP8Quantization() : Mila::Dnn::LanguageModelConfig< TDerived >
- withFullPrecision() : Mila::Dnn::LanguageModelConfig< TDerived >
- withHiddenDimension() : Mila::Dnn::LlamaConfig
- withHiddenSize() : Mila::Dnn::GptBlockConfig, Mila::Dnn::GptConfig
- withInputFeatures() : Mila::Dnn::LinearConfig
- withKvCacheCompression() : Mila::Dnn::LanguageModelConfig< TDerived >
- withLearningRate() : Mila::Dnn::Optimizers::AdamWConfig
- withMaxMerges() : Mila::Data::BpeVocabularyConfig
- withMaxSequenceLength() : Mila::Dnn::GptBlockConfig, Mila::Dnn::GptConfig, Mila::Dnn::LlamaConfig, Mila::Dnn::LpeConfig
- withMergeCaching() : Mila::Data::BpeVocabularyConfig
- withMinFrequency() : Mila::Data::BpeVocabularyConfig
- withModelDim() : Mila::Dnn::GqaConfig, Mila::Dnn::MultiHeadAttentionConfig
- withNormalizeUnicode() : Mila::Data::CharVocabularyConfig
- withNumHeads() : Mila::Dnn::GptConfig, Mila::Dnn::GqaConfig, Mila::Dnn::LlamaConfig, Mila::Dnn::MultiHeadAttentionConfig
- withNumKVHeads() : Mila::Dnn::LlamaConfig
- withNumKvHeads() : Mila::Dnn::GqaConfig
- withNumLayers() : Mila::Dnn::GptConfig
- withOutputFeatures() : Mila::Dnn::LinearConfig
- withPrefillSize() : Mila::Dnn::BuildContext
- withPreTokenization() : Mila::Data::BpeVocabularyConfig
- withPreTokenizationPattern() : Mila::Data::BpeVocabularyConfig
- withProbability() : Mila::Dnn::DropoutConfig
- withResidualScale() : Mila::Dnn::GptBlockConfig
- withRoPEScalingFactor() : Mila::Dnn::LlamaConfig
- withRoPETheta() : Mila::Dnn::LlamaConfig
- withRotaryDim() : Mila::Dnn::RopeConfig
- withSameMaskPerBatch() : Mila::Dnn::DropoutConfig
- withScalingDuringInference() : Mila::Dnn::DropoutConfig
- withScalingFactor() : Mila::Dnn::ResidualConfig
- withShape() : Mila::Dnn::BuildContext
- withSpecialTokens() : Mila::Data::BpeVocabularyConfig, Mila::Data::CharVocabularyConfig
- withVocabSize() : Mila::Data::BpeVocabularyConfig, Mila::Dnn::CrossEntropyConfig, Mila::Dnn::GptConfig, Mila::Dnn::TokenEmbeddingConfig
- withVocabularyLength() : Mila::Dnn::LlamaConfig, Mila::Dnn::LpeConfig
- withWeightDecay() : Mila::Dnn::Optimizers::AdamWConfig
- withWeightQuantization() : Mila::Dnn::LanguageModelConfig< TDerived >
- wpe_ : Mila::Dnn::Compute::CpuEncoderOp, Mila::Dnn::Compute::Cuda::Lpe::CudaLpeOp< TInput, TPrecision >, Mila::Dnn::Lpe< TDeviceType, TIndex, TPrecision >
- wpe_embedding_dim_ : Mila::Dnn::Compute::Cuda::Lpe::CudaLpeOp< TInput, TPrecision >
- wpe_grad_ : Mila::Dnn::Compute::CpuEncoderOp, Mila::Dnn::Compute::Cuda::Lpe::CudaLpeOp< TInput, TPrecision >, Mila::Dnn::Lpe< TDeviceType, TIndex, TPrecision >
- wpe_max_seq_len_ : Mila::Dnn::Compute::Cuda::Lpe::CudaLpeOp< TInput, TPrecision >
- write() : Mila::Data::MilaFileHeader
- writeBlob() : Mila::Dnn::Serialization::ModelArchive
- writeMetadata() : Mila::Dnn::Serialization::ModelArchive
- wte_ : Mila::Dnn::Compute::CpuEncoderOp, Mila::Dnn::Compute::Cuda::Lpe::CudaLpeOp< TInput, TPrecision >, Mila::Dnn::Compute::Cuda::TokenEmbedding::CudaTokenEmbeddingOp< TInput, TPrecision >, Mila::Dnn::Lpe< TDeviceType, TIndex, TPrecision >, Mila::Dnn::TokenEmbedding< TDeviceType, TIndex, TPrecision >
- wte_embedding_dim_ : Mila::Dnn::Compute::Cuda::Lpe::CudaLpeOp< TInput, TPrecision >
- wte_grad_ : Mila::Dnn::Compute::CpuEncoderOp, Mila::Dnn::Compute::Cuda::Lpe::CudaLpeOp< TInput, TPrecision >, Mila::Dnn::Compute::Cuda::TokenEmbedding::CudaTokenEmbeddingOp< TInput, TPrecision >, Mila::Dnn::Lpe< TDeviceType, TIndex, TPrecision >, Mila::Dnn::TokenEmbedding< TDeviceType, TIndex, TPrecision >
- wte_vocab_size_ : Mila::Dnn::Compute::Cuda::Lpe::CudaLpeOp< TInput, TPrecision >