Mila 0.13.48
Deep Neural Network Library
Loading...
Searching...
No Matches
Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy > Member List

This is the complete list of members for Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy >, including all inherited members.

addComponent(ComponentPtr component) | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | inline
AttentionType typedef | Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy >
attn_ | Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy > | private
backward(const TensorType &input, const TensorType &output_grad) | Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy > | inline
build(const BuildContext &context) final | Mila::Dnn::Component< TDeviceType, TPrecision > | inline, virtual
build_context_ | Mila::Dnn::Component< TDeviceType, TPrecision > | protected
built_ | Mila::Dnn::Component< TDeviceType, TPrecision > | private
cached_input_shape_ | Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy > | private
child_component_map_ | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | private
child_components_ | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | private
childCount() const noexcept | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | inline
clearComponents() | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | inline
Component(const std::string &name) | Mila::Dnn::Component< TDeviceType, TPrecision > | inline, explicit
ComponentBase typedef | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision >
ComponentPtr typedef | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision >
CompositeComponent(const std::string &name) | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | inline, explicit
CompositeComponent(const CompositeComponent &)=delete | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision >
CompositeComponent(CompositeComponent &&) noexcept=default | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision >
CompositeComponentBase typedef | Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy >
config_ | Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy > | private
createGraph() | Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy > | inline, private
d_input_ | Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy > | private
d_res1_accum_ | Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy > | private
decode(const TensorType &input, int position) | Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy > | inline
ensureBuilt(const char *method) const | Mila::Dnn::Component< TDeviceType, TPrecision > | inline, private
exec_context_ | Mila::Dnn::Component< TDeviceType, TPrecision > | private
fc_down_ | Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy > | private
fc_gate_up_ | Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy > | private
findComponent(const std::string &path) const | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | inline
forward(const TensorType &input) | Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy > | inline
forward_executed_ | Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy > | private
getComponent(const std::string &name) const | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | inline
getComponentAs(const std::string &name) const | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | inline, protected
getComponents() const | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | inline
getDeviceId() const override | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | inline, virtual
getDeviceType() | Mila::Dnn::Component< TDeviceType, TPrecision > | inline, static
getExecutionContext() const | Mila::Dnn::Component< TDeviceType, TPrecision > | inline, protected
getGradients() const override | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | inline, virtual
getMemoryStats() const override | Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy > | inline, virtual
getName() const | Mila::Dnn::Component< TDeviceType, TPrecision > | inline
getParameterNames() const | Mila::Dnn::Component< TDeviceType, TPrecision > | inline, virtual
getParameters() const override | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | inline, virtual
getPrecision() noexcept | Mila::Dnn::Component< TDeviceType, TPrecision > | inline, static
getRuntimeMode() const noexcept | Mila::Dnn::Component< TDeviceType, TPrecision > | inline
getTrainingMode() const noexcept | Mila::Dnn::Component< TDeviceType, TPrecision > | inline
getType() const override | Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy > | inline, virtual
hasChildren() const noexcept | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | inline
hasComponent(const std::string &name) const | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | inline
hasExecutionContext() const noexcept | Mila::Dnn::Component< TDeviceType, TPrecision > | inline, protected
isBuilt() const final | Mila::Dnn::Component< TDeviceType, TPrecision > | inline, virtual
isIdentifier(const std::string &s) noexcept | Mila::Dnn::Component< TDeviceType, TPrecision > | inline, private, static
isInferenceMode() const noexcept | Mila::Dnn::Component< TDeviceType, TPrecision > | inline
isTrainingMode() const noexcept | Mila::Dnn::Component< TDeviceType, TPrecision > | inline
k_ | Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy > | private
k_prefill_shape_ | Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy > | private
k_shape_ | Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy > | private
last_attn_out_ | Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy > | private
last_ffn_out_ | Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy > | private
last_gate_up_out_ | Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy > | private
last_out_proj_out_ | Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy > | private
last_qkv_out_ | Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy > | private
last_res1_out_ | Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy > | private
last_res2_out_ | Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy > | private
last_rms1_out_ | Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy > | private
last_rms2_out_ | Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy > | private
last_swiglu_out_ | Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy > | private
LinearType typedef | Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy >
LlamaBlock(const std::string &name, const LlamaConfig &config, std::optional< DeviceId > device_id=std::nullopt) | Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy > | inline, explicit
load_(ModelArchive &archive, SerializationMode mode) | Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy > | inline
loadParameter(const std::string &name, const Serialization::ITensorBlob &blob) | Mila::Dnn::Component< TDeviceType, TPrecision > | inline, virtual
loadParameterFromBlob(const std::string &param_name, const Serialization::ITensorBlob &blob, Tensor< TParameterPrecision, TMemoryResource > &target, const shape_t &expected_shape) | Mila::Dnn::Component< TDeviceType, TPrecision > | inline, protected
MR typedef | Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy >
name_ | Mila::Dnn::Component< TDeviceType, TPrecision > | private
onBuilding(const BuildContext &context) override | Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy > | inline, protected, virtual
onExecutionContextSet() override | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | inline, protected, virtual
onTrainingModeChanging(TrainingMode training_mode) override | Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy > | inline, protected, virtual
operator=(const CompositeComponent &)=delete | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision >
operator=(CompositeComponent &&) noexcept=default | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision >
optimize() | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | inline, protected, virtual
out_proj_ | Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy > | private
owned_exec_context_ | Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy > | private
parameterCount() const override | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | inline, virtual
prefill(const TensorType &input, int position_offset) | Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy > | inline
q_ | Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy > | private
q_offset_ | Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy > | private
q_prefill_offset_ | Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy > | private
q_prefill_shape_ | Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy > | private
q_shape_ | Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy > | private
qkv_proj_ | Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy > | private
removeComponent(const std::string &name) | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | inline
res1_ | Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy > | private
res1_prefill_ | Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy > | private
res2_ | Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy > | private
resetKVCache() | Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy > | inline
ResidualType typedef | Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy >
rms1_ | Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy > | private
rms2_ | Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy > | private
RmsNormType typedef | Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy >
rope_ | Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy > | private
RopeType typedef | Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy >
save_(ModelArchive &archive, SerializationMode mode) const override | Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy > | inline, virtual
setExecutionContext(IExecutionContext *context) | Mila::Dnn::Component< TDeviceType, TPrecision > | inline, protected
setState(const GqaState &state) | Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy > | inline
setTrainingMode(TrainingMode mode) | Mila::Dnn::Component< TDeviceType, TPrecision > | inline
supportsKVCache() const noexcept | Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy > | inline
swiglu_ | Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy > | private
SwiGLUType typedef | Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy >
synchronize() override | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | inline, virtual
TensorType typedef | Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy >
toString() const override | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | inline, virtual
training_mode_ | Mila::Dnn::Component< TDeviceType, TPrecision > | private
training_mode_mutex_ | Mila::Dnn::Component< TDeviceType, TPrecision > | private
tryFindComponent(const std::string &path) const | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | inline
v_ | Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy > | private
validateBuildContext(const BuildContext &context) const | Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy > | inline, private
validateInputShape(const shape_t &input_shape) const | Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy > | inline, private
validateName(const std::string &name) | Mila::Dnn::Component< TDeviceType, TPrecision > | inline, private, static
zeroGradients() override | Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy > | inline, virtual
~Component()=default | Mila::Dnn::Component< TDeviceType, TPrecision > | virtual
~CompositeComponent()=default | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | virtual
~LlamaBlock() override=default | Mila::Dnn::LlamaBlock< TDeviceType, TPrecision, TWeightQuant, TKvPolicy >