| Base typedef | Mila::Dnn::LanguageModel< TDeviceType, TPrecision > | |
| config_ | Mila::Dnn::GptModel< TDeviceType, TPrecision > | private |
| configFromMetadata(const PretrainedMetadata &metadata) | Mila::Dnn::GptModel< TDeviceType, TPrecision > | inline, private, static |
| ensureTrainingMode(const char *method) const | Mila::Dnn::Model< TDeviceType, TPrecision > | inline, private |
| eos_token_ | Mila::Dnn::GptModel< TDeviceType, TPrecision > | private, static |
| eosToken() const noexcept override | Mila::Dnn::GptModel< TDeviceType, TPrecision > | inline, protected, virtual |
| fromCheckpoint(const std::filesystem::path &path, DeviceId device_id=DeviceId{ TDeviceType, 0 }) | Mila::Dnn::GptModel< TDeviceType, TPrecision > | inline, static |
| fromPretrained(const std::filesystem::path &path, dim_t context_length, DeviceId device_id=DeviceId{ TDeviceType, 0 }, bool strict=true) | Mila::Dnn::GptModel< TDeviceType, TPrecision > | inline, static |
| generate(const std::vector< int32_t > &prompt_tokens, size_t max_new_tokens=64, float temperature=1.0f, int top_k=0) | Mila::Dnn::LanguageModel< TDeviceType, TPrecision > | inline |
| generateStreaming(const std::vector< int32_t > &prompt_tokens, std::function< void(int32_t)> on_token, size_t max_new_tokens=64, float temperature=1.0f, int top_k=0, std::stop_token stop={}) | Mila::Dnn::LanguageModel< TDeviceType, TPrecision > | inline |
| getConfig() const noexcept | Mila::Dnn::GptModel< TDeviceType, TPrecision > | inline |
| getDeviceId() const noexcept | Mila::Dnn::Model< TDeviceType, TPrecision > | inline |
| getLanguageNetwork() noexcept | Mila::Dnn::LanguageModel< TDeviceType, TPrecision > | inline, protected |
| getLanguageNetwork() const noexcept | Mila::Dnn::LanguageModel< TDeviceType, TPrecision > | inline, protected |
| getLastGenerationStatistics() const noexcept | Mila::Dnn::LanguageModel< TDeviceType, TPrecision > | inline |
| getMemoryStats() const | Mila::Dnn::Model< TDeviceType, TPrecision > | inline |
| getRuntimeMode() const noexcept | Mila::Dnn::Model< TDeviceType, TPrecision > | inline |
| GptModel(const GptModel &)=delete | Mila::Dnn::GptModel< TDeviceType, TPrecision > | |
| GptModel(GptModel &&)=default | Mila::Dnn::GptModel< TDeviceType, TPrecision > | |
| GptModel(std::unique_ptr< GptTransformerType > network, const GptConfig &config, RuntimeMode runtime_mode) | Mila::Dnn::GptModel< TDeviceType, TPrecision > | inline, explicit, private |
| GptModel(std::unique_ptr< GptTransformerType > network, const GptConfig &config) | Mila::Dnn::GptModel< TDeviceType, TPrecision > | inline, explicit, private |
| GptTransformerType typedef | Mila::Dnn::GptModel< TDeviceType, TPrecision > | |
| isEval() const noexcept | Mila::Dnn::Model< TDeviceType, TPrecision > | inline |
| isInferenceMode() const noexcept | Mila::Dnn::Model< TDeviceType, TPrecision > | inline |
| isTrainingMode() const noexcept | Mila::Dnn::Model< TDeviceType, TPrecision > | inline |
| LanguageModel(const LanguageModel &)=delete | Mila::Dnn::LanguageModel< TDeviceType, TPrecision > | |
| LanguageModel(LanguageModel &&)=default | Mila::Dnn::LanguageModel< TDeviceType, TPrecision > | |
| LanguageModel(std::unique_ptr< LanguageNetwork< TDeviceType, TPrecision > > network, RuntimeMode runtime_mode) | Mila::Dnn::LanguageModel< TDeviceType, TPrecision > | inline, explicit, protected |
| last_generation_statistics_ | Mila::Dnn::LanguageModel< TDeviceType, TPrecision > | protected |
| makeTokenTensor(const std::vector< int32_t > &token_ids) const | Mila::Dnn::GptModel< TDeviceType, TPrecision > | inline, private |
| maxSequenceLength() const noexcept override | Mila::Dnn::GptModel< TDeviceType, TPrecision > | inline, protected, virtual |
| Model(const Model &)=delete | Mila::Dnn::Model< TDeviceType, TPrecision > | |
| Model(Model &&)=default | Mila::Dnn::Model< TDeviceType, TPrecision > | |
| Model(std::unique_ptr< NetworkType > network, RuntimeMode runtime_mode) | Mila::Dnn::Model< TDeviceType, TPrecision > | inline, explicit, protected |
| ModelBase typedef | Mila::Dnn::GptModel< TDeviceType, TPrecision > | |
| MR typedef | Mila::Dnn::GptModel< TDeviceType, TPrecision > | |
| network_ | Mila::Dnn::Model< TDeviceType, TPrecision > | protected |
| NetworkType typedef | Mila::Dnn::Model< TDeviceType, TPrecision > | |
| onGenerating(const std::vector< int32_t > &prompt_tokens, const std::function< void(int32_t)> &on_token, size_t max_new_tokens, float temperature, int top_k, std::stop_token stop) override | Mila::Dnn::GptModel< TDeviceType, TPrecision > | inline, protected, virtual |
| onTraining() override | Mila::Dnn::GptModel< TDeviceType, TPrecision > | inline, protected, virtual |
| operator=(const GptModel &)=delete | Mila::Dnn::GptModel< TDeviceType, TPrecision > | |
| operator=(GptModel &&)=default | Mila::Dnn::GptModel< TDeviceType, TPrecision > | |
| Mila::Dnn::LanguageModel::operator=(const LanguageModel &)=delete | Mila::Dnn::LanguageModel< TDeviceType, TPrecision > | |
| Mila::Dnn::LanguageModel::operator=(LanguageModel &&)=default | Mila::Dnn::LanguageModel< TDeviceType, TPrecision > | |
| Mila::Dnn::Model::operator=(const Model &)=delete | Mila::Dnn::Model< TDeviceType, TPrecision > | |
| Mila::Dnn::Model::operator=(Model &&)=default | Mila::Dnn::Model< TDeviceType, TPrecision > | |
| runtime_mode_ | Mila::Dnn::Model< TDeviceType, TPrecision > | private |
| sampleFromLogits(const TensorType &logits, int64_t position, float temperature, int top_k, std::mt19937 &rng) const | Mila::Dnn::GptModel< TDeviceType, TPrecision > | inline, private |
| sampleToken(const float *logits, size_t vocab_size, float temperature, int top_k, std::mt19937 &rng) | Mila::Dnn::GptModel< TDeviceType, TPrecision > | inline, private, static |
| setEval(bool eval) | Mila::Dnn::Model< TDeviceType, TPrecision > | inline |
| stopTokens() const | Mila::Dnn::LanguageModel< TDeviceType, TPrecision > | inline, protected, virtual |
| TensorType typedef | Mila::Dnn::GptModel< TDeviceType, TPrecision > | |
| TokenIndexType typedef | Mila::Dnn::GptModel< TDeviceType, TPrecision > | |
| toString() const override | Mila::Dnn::GptModel< TDeviceType, TPrecision > | inline, virtual |
| train() | Mila::Dnn::Model< TDeviceType, TPrecision > | inline |
| truncateIfNeeded(std::vector< int32_t > &tokens) const | Mila::Dnn::GptModel< TDeviceType, TPrecision > | inline, private |
| vocabSize() const noexcept override | Mila::Dnn::GptModel< TDeviceType, TPrecision > | inline, protected, virtual |
| ~GptModel()=default | Mila::Dnn::GptModel< TDeviceType, TPrecision > | |
| ~LanguageModel()=default | Mila::Dnn::LanguageModel< TDeviceType, TPrecision > | virtual |
| ~Model()=default | Mila::Dnn::Model< TDeviceType, TPrecision > | virtual |