mycaffe/html/_my_caffe_8layers_8gpt_2_layer_factory_8cs_source.html

using System;

using System.Collections.Generic;

using System.Linq;

using System.Text;

using System.Threading.Tasks;

using MyCaffe.basecode;

using MyCaffe.common;

using MyCaffe.db.image;

using MyCaffe.param;


namespace MyCaffe.layers.gpt

{

    /// <summary>
    /// Layer creator for the MyCaffe.layers.gpt namespace. Maps the type of a
    /// LayerParameter to a new instance of the matching GPT layer, for either the
    /// double or the float base type.
    /// </summary>
    public class LayerFactory : ILayerCreator
    {
        /// <summary>
        /// Create the layer matching <paramref name="p"/> when using the <i>double</i> base type.
        /// </summary>
        /// <param name="cuda">Connection to Cuda, handed to the layer constructor.</param>
        /// <param name="log">Output log, handed to the layer constructor.</param>
        /// <param name="p">Layer parameter whose <c>type</c> selects the layer to create.</param>
        /// <param name="evtCancel">Cancel event; only forwarded to the tokenized data layers.</param>
        /// <param name="db">In-memory database; only forwarded to the tokenized data layers.</param>
        /// <returns>The new layer, or <i>null</i> when the layer type is not handled by this factory.</returns>
        public Layer<double> CreateDouble(CudaDnn<double> cuda, Log log, LayerParameter p, CancelEvent evtCancel, IXDatabaseBase db)
        {
            // Stays null for any layer type this factory does not handle.
            Layer<double> layer = null;

            switch (p.type)
            {
                // Data layers: the only ones that take the database and the cancel event.
                case LayerParameter.LayerType.TOKENIZED_DATA:
                    layer = new TokenizedDataLayer<double>(cuda, log, p, db, evtCancel);
                    break;

                case LayerParameter.LayerType.TOKENIZED_DATA_PAIRS:
                    layer = new TokenizedDataPairsLayer<double>(cuda, log, p, db, evtCancel);
                    break;

                // Remaining layers only need the cuda connection, the log and the parameter.
                case LayerParameter.LayerType.CAUSAL_SELF_ATTENTION:
                    layer = new CausalSelfAttentionLayer<double>(cuda, log, p);
                    break;

                case LayerParameter.LayerType.MULTIHEAD_ATTENTION:
                    layer = new MultiheadAttentionLayer<double>(cuda, log, p);
                    break;

                case LayerParameter.LayerType.POSITIONAL_ENCODER:
                    layer = new PositionalEncodingLayer<double>(cuda, log, p);
                    break;

                case LayerParameter.LayerType.GELU:
                    layer = new GeluLayer<double>(cuda, log, p);
                    break;

                case LayerParameter.LayerType.LAYERNORM:
                    layer = new LayerNormLayer<double>(cuda, log, p);
                    break;

                case LayerParameter.LayerType.TRANSFORMER_BLOCK:
                    layer = new TransformerBlockLayer<double>(cuda, log, p);
                    break;

                case LayerParameter.LayerType.NLL_LOSS:
                    layer = new NLLLossLayer<double>(cuda, log, p);
                    break;
            }

            return layer;
        }

        /// <summary>
        /// Create the layer matching <paramref name="p"/> when using the <i>float</i> base type.
        /// </summary>
        /// <param name="cuda">Connection to Cuda, handed to the layer constructor.</param>
        /// <param name="log">Output log, handed to the layer constructor.</param>
        /// <param name="p">Layer parameter whose <c>type</c> selects the layer to create.</param>
        /// <param name="evtCancel">Cancel event; only forwarded to the tokenized data layers.</param>
        /// <param name="db">In-memory database; only forwarded to the tokenized data layers.</param>
        /// <returns>The new layer, or <i>null</i> when the layer type is not handled by this factory.</returns>
        public Layer<float> CreateSingle(CudaDnn<float> cuda, Log log, LayerParameter p, CancelEvent evtCancel, IXDatabaseBase db)
        {
            // Stays null for any layer type this factory does not handle.
            Layer<float> layer = null;

            switch (p.type)
            {
                // Data layers: the only ones that take the database and the cancel event.
                case LayerParameter.LayerType.TOKENIZED_DATA:
                    layer = new TokenizedDataLayer<float>(cuda, log, p, db, evtCancel);
                    break;

                case LayerParameter.LayerType.TOKENIZED_DATA_PAIRS:
                    layer = new TokenizedDataPairsLayer<float>(cuda, log, p, db, evtCancel);
                    break;

                // Remaining layers only need the cuda connection, the log and the parameter.
                case LayerParameter.LayerType.CAUSAL_SELF_ATTENTION:
                    layer = new CausalSelfAttentionLayer<float>(cuda, log, p);
                    break;

                case LayerParameter.LayerType.MULTIHEAD_ATTENTION:
                    layer = new MultiheadAttentionLayer<float>(cuda, log, p);
                    break;

                case LayerParameter.LayerType.POSITIONAL_ENCODER:
                    layer = new PositionalEncodingLayer<float>(cuda, log, p);
                    break;

                case LayerParameter.LayerType.GELU:
                    layer = new GeluLayer<float>(cuda, log, p);
                    break;

                case LayerParameter.LayerType.LAYERNORM:
                    layer = new LayerNormLayer<float>(cuda, log, p);
                    break;

                case LayerParameter.LayerType.TRANSFORMER_BLOCK:
                    layer = new TransformerBlockLayer<float>(cuda, log, p);
                    break;

                case LayerParameter.LayerType.NLL_LOSS:
                    layer = new NLLLossLayer<float>(cuda, log, p);
                    break;
            }

            return layer;
        }
    }

}

MyCaffe.basecode.CancelEvent
The CancelEvent provides an extension to the manual cancel event that allows for overriding the manua...
Definition: CancelEvent.cs:17

MyCaffe.basecode.Log
The Log class provides general output in text form.
Definition: Log.cs:13

MyCaffe.common.CudaDnn
The CudaDnn object is the main interface to the Low-Level Cuda C++ DLL.
Definition: CudaDnn.cs:969

MyCaffe.layers.Layer
An interface for the units of computation which can be composed into a Net.
Definition: Layer.cs:31

MyCaffe.layers.gpt.CausalSelfAttentionLayer
The CausalSelfAttention provides a vanilla multi-head self-attention layer with projection at the end...
Definition: CausalSelfAttentionLayer.cs:21

MyCaffe.layers.gpt.GeluLayer
The GeluLayer implements the New GELU activation function currently in Google BERT repo (same as Open...
Definition: GeluLayer.cs:24

MyCaffe.layers.gpt.LayerFactory
The LayerFactory is responsible for creating all layers implemented in the MyCaffe....
Definition: LayerFactory.cs:20

MyCaffe.layers.gpt.LayerFactory.CreateSingle
Layer< float > CreateSingle(CudaDnn< float > cuda, Log log, LayerParameter p, CancelEvent evtCancel, IXDatabaseBase db)
Create the layers when using the float base type.
Definition: LayerFactory.cs:75

MyCaffe.layers.gpt.LayerFactory.CreateDouble
Layer< double > CreateDouble(CudaDnn< double > cuda, Log log, LayerParameter p, CancelEvent evtCancel, IXDatabaseBase db)
Create the layers when using the double base type.
Definition: LayerFactory.cs:30

MyCaffe.layers.gpt.LayerNormLayer
The LayerNormalizationLayer performs layer normalization similar to the PyTorch LayerNorm layer.
Definition: LayerNormLayer.cs:23

MyCaffe.layers.gpt.MultiheadAttentionLayer
The MultiheadAttention provides a vanilla multi-head layer.
Definition: MultiheadAttentionLayer.cs:23

MyCaffe.layers.gpt.NLLLossLayer
Computes the nll loss for a one-of-many classification task, passing real-valued predictions (from a ...
Definition: NLLLossLayer.cs:23

MyCaffe.layers.gpt.PositionalEncodingLayer
The PositionalEncodingLayer is a neuron layer that adds positional encoding to the input.
Definition: PositionalEncodingLayer.cs:20

MyCaffe.layers.gpt.TokenizedDataLayer
The TokenizedDataLayer loads and tokenizes data for a transformer model where data is loaded in the f...
Definition: TokenizedDataLayer.cs:21

MyCaffe.layers.gpt.TokenizedDataPairsLayer
The TokenizedDataPairsLayer loads and tokenizes data for a transformer model where data is loaded in ...
Definition: TokenizedDataPairsLayer.cs:28

MyCaffe.layers.gpt.TransformerBlockLayer
The TransformerBlock provides a generic transformer block
Definition: TransformerBlockLayer.cs:24

MyCaffe.param.LayerParameter
Specifies the base parameter for all layers.
Definition: LayerParameter.cs:24

MyCaffe.param.LayerParameter.type
LayerType type
Specifies the type of this LayerParameter.
Definition: LayerParameter.cs:1874

MyCaffe.param.LayerParameter.LayerType
LayerType
Specifies the layer type.
Definition: LayerParameter.cs:110

MyCaffe.ILayerCreator
The ILayerCreator interface is implemented by each MyCaffe.layers.x layer extension dll and is used t...
Definition: Interfaces.cs:19

MyCaffe.basecode.IXDatabaseBase
The IXDatabaseBase interface defines the general interface to the in-memory database.
Definition: Interfaces.cs:444

MyCaffe.basecode
The MyCaffe.basecode contains all generic types used throughout MyCaffe.
Definition: Annotation.cs:12

MyCaffe.common
The MyCaffe.common namespace contains common MyCaffe classes.
Definition: BatchInput.cs:8

MyCaffe.db.image
The MyCaffe.db.image namespace contains all image database related classes.
Definition: Database.cs:18

MyCaffe.db
Definition: Database.cs:18

MyCaffe.layers.gpt
The MyCaffe.layers.gpt namespace contains all GPT related layers.
Definition: LayerFactory.cs:15

MyCaffe.param
The MyCaffe.param namespace contains parameters used to create models.
Definition: AttentionParameter.cs:9

MyCaffe
The MyCaffe namespace contains the main body of MyCaffe code that closely tracks the C++ Caffe open-...
Definition: Annotation.cs:12

System
Definition: Component.cs:11