|
Mila 0.13.48
Deep Neural Network Library
|
#include <string>
#include <vector>
#include <memory>
#include <sstream>
#include <type_traits>
#include <stdexcept>
#include <cstdint>
#include <cstring>
#include <ostream>
#include <iostream>
#include <filesystem>
#include <format>
#include <optional>
#include <cassert>
#include <random>
#include <chrono>
#include <algorithm>
#include <numeric>
import Logging.Logger;
import Serialization.Tensor;
import Serialization.Mode;
import Serialization.ModelArchive;
import Compute.ExecutionContextFactory;
import Compute.CpuMemoryResource;
import Compute.DeviceType;
import Compute.Device;
import Dnn.ActivationType;
import Dnn.ComponentType;
import Dnn.Tensor;
import Dnn.ITensor;
import Dnn.Components.Lpe;
import Serialization.PretrainedReader;
import Compute.ExecutionContext;
import Dnn.Components.GptBlock;
import Dnn.TensorTypes;
import Dnn.TensorDataType;
import Dnn.Components.GptTransformer:Presets;
import Dnn.Components.Linear;
import Dnn.TensorDataTypeTraits;
import Dnn.RuntimeMode;
import Dnn.LanguageNetwork;
import Dnn.Component;
import Compute.DeviceTypeTraits;
import Compute.DeviceId;
import Dnn.Components.LayerNorm;
Classes | |
| class | Mila::Dnn::GptTransformer< TDeviceType, TPrecision > |
| GPT-2 style transformer (decoder-only) for autoregressive token prediction. More... | |
Namespaces | |
| namespace | Mila |
| Mila main API namespace. | |
| namespace | Mila::Dnn |