Mila 0.13.48
Deep Neural Network Library
Loading...
Searching...
No Matches
Mila::Dnn::GptTransformer< TDeviceType, TPrecision > Member List

This is the complete list of members for Mila::Dnn::GptTransformer< TDeviceType, TPrecision >, including all inherited members.

addComponent(ComponentPtr component) | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | inline
backward(const TokenIndexType &input, const TensorType &output_grad) override | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | inline
Mila::Dnn::LanguageNetwork::backward(const TokenIndexType &input, const TensorType &output_grad)=0 | Mila::Dnn::LanguageNetwork< TDeviceType, TPrecision > | pure virtual
batch_size_ | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | private
block_input_ptrs_ | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | private
block_output_ptrs_ | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | private
build(const BuildContext &context) final | Mila::Dnn::Component< TDeviceType, TPrecision > | inline, virtual
build_context_ | Mila::Dnn::Component< TDeviceType, TPrecision > | protected
built_ | Mila::Dnn::Component< TDeviceType, TPrecision > | private
child_component_map_ | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | private
child_components_ | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | private
childCount() const noexcept | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | inline
clearComponents() | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | inline
Component(const std::string &name) | Mila::Dnn::Component< TDeviceType, TPrecision > | inline, explicit
ComponentBase typedef | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision >
ComponentPtr typedef | Mila::Dnn::GptTransformer< TDeviceType, TPrecision >
CompositeBase typedef | Mila::Dnn::Network< TDeviceType, TPrecision >
CompositeComponent(const std::string &name) | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | inline, explicit
CompositeComponent(const CompositeComponent &)=delete | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision >
CompositeComponent(CompositeComponent &&) noexcept=default | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision >
config_ | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | private
createConfigFromMetadata(const PretrainedMetadata &metadata) -> GptConfig | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | inline, private, static
createGraph() | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | inline, private
createOptimizer(const TConfig &config) | Mila::Dnn::Network< TDeviceType, TPrecision > | inline
decode(const TokenIndexType &input, int position) override | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | inline
Mila::Dnn::LanguageNetwork::decode(const TokenIndexType &input, int position)=0 | Mila::Dnn::LanguageNetwork< TDeviceType, TPrecision > | pure virtual
embedding_shape_ | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | private
encoder_ | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | private
encoder_out_ptr_ | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | private
EncoderType typedef | Mila::Dnn::GptTransformer< TDeviceType, TPrecision >
ensureBuilt(const char *method) const | Mila::Dnn::Component< TDeviceType, TPrecision > | inline, private
exec_context_ | Mila::Dnn::Component< TDeviceType, TPrecision > | private
final_layernorm_ | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | private
findComponent(const std::string &path) const | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | inline
forward(const TokenIndexType &input) override | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | inline
Mila::Dnn::LanguageNetwork::forward(const TokenIndexType &input)=0 | Mila::Dnn::LanguageNetwork< TDeviceType, TPrecision > | pure virtual
fromPretrained(const std::filesystem::path &model_path, std::size_t batch_size, std::size_t seq_length, DeviceId device_id=DeviceId{ TDeviceType, 0 }, bool strict=true) | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | inline, static
getComponent(const std::string &name) const | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | inline
getComponentAs(const std::string &name) const | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | inline, protected
getComponents() const | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | inline
getDeviceId() const noexcept | Mila::Dnn::Network< TDeviceType, TPrecision > | inline, virtual
getDeviceType() | Mila::Dnn::Component< TDeviceType, TPrecision > | inline, static
getExecutionContext() const | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | inline
getGradients() const override | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | inline, virtual
getMemoryStats() const override | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | inline, virtual
getName() const | Mila::Dnn::Component< TDeviceType, TPrecision > | inline
getParameterNames() const | Mila::Dnn::Component< TDeviceType, TPrecision > | inline, virtual
getParameters() const override | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | inline, virtual
getPrecision() noexcept | Mila::Dnn::Component< TDeviceType, TPrecision > | inline, static
getRuntimeMode() const noexcept | Mila::Dnn::Component< TDeviceType, TPrecision > | inline
getTrainingMode() const noexcept | Mila::Dnn::Component< TDeviceType, TPrecision > | inline
getType() const override | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | inline, virtual
GptTransformer(const std::string &name, const GptConfig &config, DeviceId device_id) | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | inline, explicit
hasChildren() const noexcept | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | inline
hasComponent(const std::string &name) const | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | inline
hasExecutionContext() const noexcept | Mila::Dnn::Component< TDeviceType, TPrecision > | inline, protected
isBuilt() const final | Mila::Dnn::Component< TDeviceType, TPrecision > | inline, virtual
isIdentifier(const std::string &s) noexcept | Mila::Dnn::Component< TDeviceType, TPrecision > | inline, private, static
isInferenceMode() const noexcept | Mila::Dnn::Component< TDeviceType, TPrecision > | inline
isTrainingMode() const noexcept | Mila::Dnn::Component< TDeviceType, TPrecision > | inline
LanguageNetwork(const std::string &name) | Mila::Dnn::LanguageNetwork< TDeviceType, TPrecision > | inline, explicit
LayerNormType typedef | Mila::Dnn::GptTransformer< TDeviceType, TPrecision >
leading_shape_ | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | private
LinearType typedef | Mila::Dnn::GptTransformer< TDeviceType, TPrecision >
lm_head_ | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | private
loadParameter(const std::string &name, const Serialization::ITensorBlob &blob) | Mila::Dnn::Component< TDeviceType, TPrecision > | inline, virtual
loadParameterFromBlob(const std::string &param_name, const Serialization::ITensorBlob &blob, Tensor< TParameterPrecision, TMemoryResource > &target, const shape_t &expected_shape) | Mila::Dnn::Component< TDeviceType, TPrecision > | inline, protected
loadParameters(PretrainedModelReader &reader, bool strict) | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | inline
logits_ptr_ | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | private
MR typedef | Mila::Dnn::GptTransformer< TDeviceType, TPrecision >
name_ | Mila::Dnn::Component< TDeviceType, TPrecision > | private
Network(const std::string &name) | Mila::Dnn::Network< TDeviceType, TPrecision > | inline, explicit
NetworkBase typedef | Mila::Dnn::GptTransformer< TDeviceType, TPrecision >
normalized_ptr_ | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | private
onBuilding(const BuildContext &context) override | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | inline, protected, virtual
onExecutionContextSet() override | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | inline, protected, virtual
onTrainingModeChanging(TrainingMode training_mode) override | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | inline, protected, virtual
operator=(const CompositeComponent &)=delete | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision >
operator=(CompositeComponent &&) noexcept=default | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision >
optimize() | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | inline, protected, virtual
output_shape_ | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | private
owned_context_ | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | private
parameterCount() const override | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | inline, virtual
parseLayerIndex(const std::string &name) | Mila::Dnn::Network< TDeviceType, TPrecision > | inline, private
parseParameterPath(const std::string &full_name) const | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | inline, private
parseTensorName(const std::string &tensor_name) | Mila::Dnn::Network< TDeviceType, TPrecision > | inline, private
prefill(const TokenIndexType &input) override | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | inline
Mila::Dnn::LanguageNetwork::prefill(const TokenIndexType &input)=0 | Mila::Dnn::LanguageNetwork< TDeviceType, TPrecision > | pure virtual
removeComponent(const std::string &name) | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | inline
save(ModelArchive &archive, SerializationMode mode) const | Mila::Dnn::Network< TDeviceType, TPrecision > | inline
save_(ModelArchive &archive, SerializationMode) const override | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | inline, protected, virtual
saveComponentGraph(ModelArchive &archive, SerializationMode mode) const | Mila::Dnn::Network< TDeviceType, TPrecision > | inline, private
saveNetworkMetadata(ModelArchive &archive, SerializationMode mode) const | Mila::Dnn::Network< TDeviceType, TPrecision > | inline, private
seq_length_ | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | private
setExecutionContext(IExecutionContext *context) | Mila::Dnn::Component< TDeviceType, TPrecision > | inline, protected
setTrainingMode(TrainingMode mode) | Mila::Dnn::Component< TDeviceType, TPrecision > | inline
synchronize() override | Mila::Dnn::Network< TDeviceType, TPrecision > | inline, virtual
TensorType typedef | Mila::Dnn::GptTransformer< TDeviceType, TPrecision >
TokenIndexType typedef | Mila::Dnn::GptTransformer< TDeviceType, TPrecision >
toString() const override | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | inline, virtual
training_mode_ | Mila::Dnn::Component< TDeviceType, TPrecision > | private
training_mode_mutex_ | Mila::Dnn::Component< TDeviceType, TPrecision > | private
transformer_blocks_ | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | private
TransformerBlockType typedef | Mila::Dnn::GptTransformer< TDeviceType, TPrecision >
tryFindComponent(const std::string &path) const | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | inline
validateBuildContext(const BuildContext &context) const | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | inline, private
validateInputShape(const shape_t &input_shape) const | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | inline, private
validateName(const std::string &name) | Mila::Dnn::Component< TDeviceType, TPrecision > | inline, private, static
verifyArchitectureCompatibility(const PretrainedMetadata &metadata) | Mila::Dnn::Network< TDeviceType, TPrecision > | inline, protected
zeroGradients() override | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | inline, virtual
~Component()=default | Mila::Dnn::Component< TDeviceType, TPrecision > | virtual
~CompositeComponent()=default | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | virtual
~GptTransformer() override=default | Mila::Dnn::GptTransformer< TDeviceType, TPrecision >
~LanguageNetwork() override=default | Mila::Dnn::LanguageNetwork< TDeviceType, TPrecision >
~Network() override=default | Mila::Dnn::Network< TDeviceType, TPrecision >