Mila
Deep Neural Network Library
|
Implementation of the CUDA-based Encoder operation for transformer models. More...
#include <cuda_fp16.h>
#include <vector>
#include <memory>
#include <string>
#include <stdexcept>
#include "Kernels/CudaOps.h"
import Compute.CudaDevice;
import Compute.CudaMemoryResource;
import Dnn.Modules.Encoder;
import Dnn.Tensor;
import Dnn.TensorTraits;
import Compute.Precision;
import Dnn.ComponentConfig;
import Compute.OperationBase;
import Compute.UnaryOperation;
import Compute.OperationRegistry;
import Compute.OperationType;
import Compute.DeviceType;
import Compute.DeviceContext;
import Compute.OperationAttributes;
import Compute.MemoryResource;
Classes | |
struct | Mila::Dnn::Compute::Detail::cuda_encoder_impl< float > |
Single-precision (float) specialization for CUDA encoder operations. More... | |
struct | Mila::Dnn::Compute::Detail::cuda_encoder_impl< half > |
Half-precision (half) specialization for CUDA encoder operations. More... | |
class | Mila::Dnn::Compute::CudaEncoderOp< TInput, TOutput > |
CUDA implementation of the Encoder operation for transformer models. More... | |
class | Mila::Dnn::Compute::CudaEncoderOpRegistrar |
Class responsible for registering the CudaEncoderOp operation. More... | |
Namespaces | |
namespace | Mila |
namespace | Mila::Dnn |
namespace | Mila::Dnn::Compute |
namespace | Mila::Dnn::Compute::Detail |
Namespace for CUDA encoder implementation details. | |
Implementation of the CUDA-based Encoder operation for transformer models.