Mila 0.13.48
Deep Neural Network Library
Loading...
Searching...
No Matches
GptTransformer.ixx File Reference
#include <string>
#include <vector>
#include <memory>
#include <sstream>
#include <type_traits>
#include <stdexcept>
#include <cstdint>
#include <cstring>
#include <ostream>
#include <iostream>
#include <filesystem>
#include <format>
#include <optional>
#include <cassert>
#include <random>
#include <chrono>
#include <algorithm>
#include <numeric>
import Logging.Logger;
import Serialization.Tensor;
import Serialization.Mode;
import Serialization.ModelArchive;
import Compute.ExecutionContextFactory;
import Compute.CpuMemoryResource;
import Compute.DeviceType;
import Compute.Device;
import Dnn.ActivationType;
import Dnn.ComponentType;
import Dnn.Tensor;
import Dnn.ITensor;
import Dnn.Components.Lpe;
import Serialization.PretrainedReader;
import Compute.ExecutionContext;
import Dnn.Components.GptBlock;
import Dnn.TensorTypes;
import Dnn.TensorDataType;
import Dnn.Components.GptTransformer:Presets;
import Dnn.Components.Linear;
import Dnn.TensorDataTypeTraits;
import Dnn.RuntimeMode;
import Dnn.LanguageNetwork;
import Dnn.Component;
import Compute.DeviceTypeTraits;
import Compute.DeviceId;
import Dnn.Components.LayerNorm;

Classes

class  Mila::Dnn::GptTransformer< TDeviceType, TPrecision >
 GPT-2-style decoder-only transformer for autoregressive token prediction. More...

Namespaces

namespace  Mila
 Mila main API namespace.
namespace  Mila::Dnn