| addComponent(ComponentPtr component) | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | inline |
| backward(const TokenIndexType &input, const TensorType &output_grad) override | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | inline |
| Mila::Dnn::LanguageNetwork::backward(const TokenIndexType &input, const TensorType &output_grad)=0 | Mila::Dnn::LanguageNetwork< TDeviceType, TPrecision > | pure virtual |
| batch_size_ | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | private |
| block_input_ptrs_ | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | private |
| block_output_ptrs_ | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | private |
| build(const BuildContext &context) final | Mila::Dnn::Component< TDeviceType, TPrecision > | inline virtual |
| build_context_ | Mila::Dnn::Component< TDeviceType, TPrecision > | protected |
| built_ | Mila::Dnn::Component< TDeviceType, TPrecision > | private |
| child_component_map_ | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | private |
| child_components_ | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | private |
| childCount() const noexcept | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | inline |
| clearComponents() | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | inline |
| Component(const std::string &name) | Mila::Dnn::Component< TDeviceType, TPrecision > | inline explicit |
| ComponentBase typedef | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | |
| ComponentPtr typedef | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | |
| CompositeBase typedef | Mila::Dnn::Network< TDeviceType, TPrecision > | |
| CompositeComponent(const std::string &name) | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | inline explicit |
| CompositeComponent(const CompositeComponent &)=delete | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | |
| CompositeComponent(CompositeComponent &&) noexcept=default | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | |
| config_ | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | private |
| createConfigFromMetadata(const PretrainedMetadata &metadata) -> GptConfig | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | inline private static |
| createGraph() | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | inline private |
| createOptimizer(const TConfig &config) | Mila::Dnn::Network< TDeviceType, TPrecision > | inline |
| decode(const TokenIndexType &input, int position) override | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | inline |
| Mila::Dnn::LanguageNetwork::decode(const TokenIndexType &input, int position)=0 | Mila::Dnn::LanguageNetwork< TDeviceType, TPrecision > | pure virtual |
| embedding_shape_ | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | private |
| encoder_ | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | private |
| encoder_out_ptr_ | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | private |
| EncoderType typedef | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | |
| ensureBuilt(const char *method) const | Mila::Dnn::Component< TDeviceType, TPrecision > | inline private |
| exec_context_ | Mila::Dnn::Component< TDeviceType, TPrecision > | private |
| final_layernorm_ | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | private |
| findComponent(const std::string &path) const | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | inline |
| forward(const TokenIndexType &input) override | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | inline |
| Mila::Dnn::LanguageNetwork::forward(const TokenIndexType &input)=0 | Mila::Dnn::LanguageNetwork< TDeviceType, TPrecision > | pure virtual |
| fromPretrained(const std::filesystem::path &model_path, std::size_t batch_size, std::size_t seq_length, DeviceId device_id=DeviceId{ TDeviceType, 0 }, bool strict=true) | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | inline static |
| getComponent(const std::string &name) const | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | inline |
| getComponentAs(const std::string &name) const | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | inline protected |
| getComponents() const | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | inline |
| getDeviceId() const noexcept | Mila::Dnn::Network< TDeviceType, TPrecision > | inline virtual |
| getDeviceType() | Mila::Dnn::Component< TDeviceType, TPrecision > | inline static |
| getExecutionContext() const | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | inline |
| getGradients() const override | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | inline virtual |
| getMemoryStats() const override | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | inline virtual |
| getName() const | Mila::Dnn::Component< TDeviceType, TPrecision > | inline |
| getParameterNames() const | Mila::Dnn::Component< TDeviceType, TPrecision > | inline virtual |
| getParameters() const override | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | inline virtual |
| getPrecision() noexcept | Mila::Dnn::Component< TDeviceType, TPrecision > | inline static |
| getRuntimeMode() const noexcept | Mila::Dnn::Component< TDeviceType, TPrecision > | inline |
| getTrainingMode() const noexcept | Mila::Dnn::Component< TDeviceType, TPrecision > | inline |
| getType() const override | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | inline virtual |
| GptTransformer(const std::string &name, const GptConfig &config, DeviceId device_id) | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | inline explicit |
| hasChildren() const noexcept | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | inline |
| hasComponent(const std::string &name) const | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | inline |
| hasExecutionContext() const noexcept | Mila::Dnn::Component< TDeviceType, TPrecision > | inline protected |
| isBuilt() const final | Mila::Dnn::Component< TDeviceType, TPrecision > | inline virtual |
| isIdentifier(const std::string &s) noexcept | Mila::Dnn::Component< TDeviceType, TPrecision > | inline private static |
| isInferenceMode() const noexcept | Mila::Dnn::Component< TDeviceType, TPrecision > | inline |
| isTrainingMode() const noexcept | Mila::Dnn::Component< TDeviceType, TPrecision > | inline |
| LanguageNetwork(const std::string &name) | Mila::Dnn::LanguageNetwork< TDeviceType, TPrecision > | inline explicit |
| LayerNormType typedef | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | |
| leading_shape_ | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | private |
| LinearType typedef | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | |
| lm_head_ | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | private |
| loadParameter(const std::string &name, const Serialization::ITensorBlob &blob) | Mila::Dnn::Component< TDeviceType, TPrecision > | inline virtual |
| loadParameterFromBlob(const std::string &param_name, const Serialization::ITensorBlob &blob, Tensor< TParameterPrecision, TMemoryResource > &target, const shape_t &expected_shape) | Mila::Dnn::Component< TDeviceType, TPrecision > | inline protected |
| loadParameters(PretrainedModelReader &reader, bool strict) | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | inline |
| logits_ptr_ | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | private |
| MR typedef | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | |
| name_ | Mila::Dnn::Component< TDeviceType, TPrecision > | private |
| Network(const std::string &name) | Mila::Dnn::Network< TDeviceType, TPrecision > | inline explicit |
| NetworkBase typedef | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | |
| normalized_ptr_ | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | private |
| onBuilding(const BuildContext &context) override | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | inline protected virtual |
| onExecutionContextSet() override | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | inline protected virtual |
| onTrainingModeChanging(TrainingMode training_mode) override | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | inline protected virtual |
| operator=(const CompositeComponent &)=delete | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | |
| operator=(CompositeComponent &&) noexcept=default | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | |
| optimize() | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | inline protected virtual |
| output_shape_ | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | private |
| owned_context_ | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | private |
| parameterCount() const override | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | inline virtual |
| parseLayerIndex(const std::string &name) | Mila::Dnn::Network< TDeviceType, TPrecision > | inline private |
| parseParameterPath(const std::string &full_name) const | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | inline private |
| parseTensorName(const std::string &tensor_name) | Mila::Dnn::Network< TDeviceType, TPrecision > | inline private |
| prefill(const TokenIndexType &input) override | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | inline |
| Mila::Dnn::LanguageNetwork::prefill(const TokenIndexType &input)=0 | Mila::Dnn::LanguageNetwork< TDeviceType, TPrecision > | pure virtual |
| removeComponent(const std::string &name) | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | inline |
| save(ModelArchive &archive, SerializationMode mode) const | Mila::Dnn::Network< TDeviceType, TPrecision > | inline |
| save_(ModelArchive &archive, SerializationMode) const override | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | inline protected virtual |
| saveComponentGraph(ModelArchive &archive, SerializationMode mode) const | Mila::Dnn::Network< TDeviceType, TPrecision > | inline private |
| saveNetworkMetadata(ModelArchive &archive, SerializationMode mode) const | Mila::Dnn::Network< TDeviceType, TPrecision > | inline private |
| seq_length_ | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | private |
| setExecutionContext(IExecutionContext *context) | Mila::Dnn::Component< TDeviceType, TPrecision > | inlineprotected |
| setTrainingMode(TrainingMode mode) | Mila::Dnn::Component< TDeviceType, TPrecision > | inline |
| synchronize() override | Mila::Dnn::Network< TDeviceType, TPrecision > | inline virtual |
| TensorType typedef | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | |
| TokenIndexType typedef | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | |
| toString() const override | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | inline virtual |
| training_mode_ | Mila::Dnn::Component< TDeviceType, TPrecision > | private |
| training_mode_mutex_ | Mila::Dnn::Component< TDeviceType, TPrecision > | private |
| transformer_blocks_ | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | private |
| TransformerBlockType typedef | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | |
| tryFindComponent(const std::string &path) const | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | inline |
| validateBuildContext(const BuildContext &context) const | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | inline private |
| validateInputShape(const shape_t &input_shape) const | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | inline private |
| validateName(const std::string &name) | Mila::Dnn::Component< TDeviceType, TPrecision > | inline private static |
| verifyArchitectureCompatibility(const PretrainedMetadata &metadata) | Mila::Dnn::Network< TDeviceType, TPrecision > | inline protected |
| zeroGradients() override | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | inline virtual |
| ~Component()=default | Mila::Dnn::Component< TDeviceType, TPrecision > | virtual |
| ~CompositeComponent()=default | Mila::Dnn::CompositeComponent< TDeviceType, TPrecision > | virtual |
| ~GptTransformer() override=default | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > | |
| ~LanguageNetwork() override=default | Mila::Dnn::LanguageNetwork< TDeviceType, TPrecision > | |
| ~Network() override=default | Mila::Dnn::Network< TDeviceType, TPrecision > | |