MyCaffe  1.12.2.41
Deep learning software for Windows C# programmers.
VarSelNetLayer.cs
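The VarSetNetLayer implements the Variable Selection Network (VSN) used by the TFT (Temporal Fusion Transformer) layers: it learns a softmax selection weight for each input variable and sums the weighted outputs of per-variable GRNs.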
using System;
using System.Collections.Generic;
using System.Diagnostics;
using System.Linq;
using System.Net.Http.Headers;
using System.Reflection;
using System.Text;
using MyCaffe.basecode;
using MyCaffe.common;
using MyCaffe.param;

namespace MyCaffe.layers.tft
{
    /// <summary>
    /// The VarSetNetLayer implements the Variable Selection Network.
    /// </summary>
    public class VarSetNetLayer<T> : Layer<T>
    {
        Layer<T> m_grnFlatten;
        Blob<T> m_blobSparseWts;
        Layer<T> m_softmax;
        Blob<T> m_blobSparseWtsSmx;
        Layer<T> m_transpose;
        Blob<T> m_blobSparseWtsSmxT;
        Blob<T> m_blobGrn1;
        Blob<T> m_blobProcessedInputs;
        Blob<T> m_blobProcessedInputsT;
        Blob<T> m_blobProcessedInputs1;
        Blob<T> m_blobBtm;
        List<Layer<T>> m_rgSingleVarGrn = new List<Layer<T>>();
        BlobCollection<T> m_colSingleVarGrn = new BlobCollection<T>();
        BlobCollection<T> m_colTop = new BlobCollection<T>();
        BlobCollection<T> m_colBtm = new BlobCollection<T>();
        List<int> m_rgShape = new List<int>(4);
        List<int> m_rgShapeOringal = new List<int>(4);

        /// <summary>
        /// The constructor.
        /// </summary>
        public VarSetNetLayer(CudaDnn<T> cuda, Log log, LayerParameter p)
            : base(cuda, log, p)
        {
            m_type = LayerParameter.LayerType.VARSELNET;

            m_blobSparseWts = new Blob<T>(cuda, log);
            m_blobSparseWts.Name = p.name + ".spwts";
            m_blobSparseWtsSmx = new Blob<T>(cuda, log);
            m_blobSparseWtsSmx.Name = p.name + ".spwts_smx";
            m_blobSparseWtsSmxT = new Blob<T>(cuda, log);
            m_blobSparseWtsSmxT.Name = p.name + ".spwts_smxT";
            m_blobGrn1 = new Blob<T>(cuda, log);
            m_blobGrn1.Name = p.name + ".grn1";
            m_blobProcessedInputs = new Blob<T>(cuda, log);
            m_blobProcessedInputs.Name = p.name + ".proc_in";
            m_blobProcessedInputsT = new Blob<T>(cuda, log);
            m_blobProcessedInputsT.Name = p.name + ".proc_inT";
            m_blobProcessedInputs1 = new Blob<T>(cuda, log);
            m_blobProcessedInputs1.Name = p.name + ".proc_in1";
            m_blobBtm = new Blob<T>(cuda, log);
            m_blobBtm.Name = p.name + ".btm";
        }

        /// <summary>
        /// Releases all GPU and host resources used by the Layer.
        /// </summary>
        protected override void dispose()
        {
            dispose(ref m_blobSparseWts);
            dispose(ref m_blobSparseWtsSmx);
            dispose(ref m_blobSparseWtsSmxT);
            dispose(ref m_blobGrn1);
            dispose(ref m_blobProcessedInputs);
            dispose(ref m_blobProcessedInputsT);
            dispose(ref m_blobProcessedInputs1);
            dispose(ref m_blobBtm);

            if (m_colSingleVarGrn != null)
            {
                m_colSingleVarGrn.Dispose();
                m_colSingleVarGrn = null;
            }

            dispose(ref m_grnFlatten);

            if (m_rgSingleVarGrn != null)
            {
                foreach (Layer<T> layer in m_rgSingleVarGrn)
                {
                    layer.Dispose();
                }
                m_rgSingleVarGrn = null;
            }
        }

        /// <summary>
        /// Derivative layers should add all internal blobs to the 'col' provided.
        /// </summary>
        protected override void setup_internal_blobs(BlobCollection<T> col)
        {
            if (col.Count > 0)
                return;

            col.Add(m_blobSparseWts);
            col.Add(m_blobSparseWtsSmx);
            col.Add(m_blobSparseWtsSmxT);
            col.Add(m_blobGrn1);
            col.Add(m_blobProcessedInputs);
            col.Add(m_blobProcessedInputsT);
            col.Add(m_blobProcessedInputs1);
            col.Add(m_blobBtm);
        }

        /// <summary>
        /// Returns the minimum number of required bottom (input) Blobs: flattened_embedding
        /// </summary>
        public override int MinBottomBlobs
        {
            get { return 1; }
        }

        /// <summary>
        /// Returns the maximum number of required bottom (input) Blobs: flattened_embedding, context
        /// </summary>
        public override int MaxBottomBlobs
        {
            get { return 2; }
        }

        /// <summary>
        /// Returns the minimum number of required top (output) Blobs: outputs_sum
        /// </summary>
        public override int MinTopBlobs
        {
            get { return 1; }
        }

        /// <summary>
        /// Returns the maximum number of required top (output) Blobs: outputs_sum, sparse_wts
        /// </summary>
        public override int MaxTopBlobs
        {
            get { return 2; }
        }

        private void addBtmTop(Blob<T> btm, Blob<T> top)
        {
            m_colBtm.Clear();
            m_colBtm.Add(btm);
            m_colTop.Clear();
            m_colTop.Add(top);
        }

        /// <summary>
        /// Setup the layer.
        /// </summary>
        public override void LayerSetUp(BlobCollection<T> colBottom, BlobCollection<T> colTop)
        {
            List<int> rgShape = new List<int>();
            Blob<T> blobStaticSelection = null;

            if (colBottom.Count > 1)
                blobStaticSelection = colBottom[1];

            // This GRN is applied on the flat concatenation of the input representation (all inputs together),
            // possibly provided with context information.
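            // Illustrative dimensions (example values only, not taken from the code): with num_inputs = 4 and
            // input_dim = 64, this flattened GRN maps each row of width num_inputs * input_dim = 256 down to
            // num_inputs = 4 selection logits.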
            if (m_grnFlatten == null)
            {
                LayerParameter p = new LayerParameter(LayerParameter.LayerType.GRN);
                p.grn_param.axis = m_param.varselnet_param.axis;
                p.grn_param.batch_first = m_param.varselnet_param.batch_first;
                p.grn_param.bias_filler = m_param.varselnet_param.bias_filler;
                p.grn_param.weight_filler = m_param.varselnet_param.weight_filler;
                p.grn_param.input_dim = m_param.varselnet_param.num_inputs * m_param.varselnet_param.input_dim;
                p.grn_param.hidden_dim = m_param.varselnet_param.hidden_dim;
                p.grn_param.output_dim = m_param.varselnet_param.num_inputs;
                p.grn_param.context_dim = m_param.varselnet_param.context_dim;
                m_grnFlatten = Layer<T>.Create(m_cuda, m_log, convertLayerParam(p, m_param), null);

                addBtmTop(colBottom[0], m_blobSparseWts);
                if (blobStaticSelection != null)
                    m_colBtm.Add(blobStaticSelection);
                m_grnFlatten.Setup(m_colBtm, m_colTop);
                blobs.Add(m_grnFlatten.blobs);
            }

            // Activation for transforming the GRN output to weights.
            if (m_softmax == null)
            {
                // Note: the original LayerParameter settings for the softmax (axis, engine) are elided in this
                // listing; the values below follow the pattern used for the other sub-layers.
                LayerParameter p = new LayerParameter(LayerParameter.LayerType.SOFTMAX);
                p.softmax_param.axis = m_param.varselnet_param.axis;
                p.softmax_param.engine = EngineParameter.Engine.CAFFE;
                m_softmax = Layer<T>.Create(m_cuda, m_log, convertLayerParam(p, m_param), null);

                addBtmTop(m_blobSparseWts, m_blobSparseWtsSmx);
                m_softmax.Setup(m_colBtm, m_colTop);
            }

            rgShape = Utility.Clone<int>(m_blobSparseWtsSmx.shape());
            rgShape.Add(1);
            rgShape.Add(1);
            m_blobSparseWtsSmx.Reshape(rgShape);

            // Setup the transpose applied to the softmax output.
            if (m_transpose == null)
            {
                LayerParameter p = new LayerParameter(LayerParameter.LayerType.TRANSPOSE);
                p.transpose_param.dim[1] = 2;
                p.transpose_param.dim[2] = 1;
                m_transpose = Layer<T>.Create(m_cuda, m_log, convertLayerParam(p, m_param), null);

                addBtmTop(m_blobSparseWtsSmx, m_blobSparseWtsSmxT);
                m_transpose.Setup(m_colBtm, m_colTop);
            }

            // Each input variable (after transformation into its wide representation) goes through its own GRN.
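            // Each per-variable GRN below maps a slice of width input_dim (= channels / num_inputs) to a vector of
            // width hidden_dim, so every input variable gets its own transformation before the weighted combination.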
            rgShape.Clear();
            rgShape.Add(colBottom[0].num);
            rgShape.Add(colBottom[0].channels / m_param.varselnet_param.num_inputs);
            m_blobGrn1.Reshape(rgShape);

            if (m_rgSingleVarGrn.Count < m_param.varselnet_param.num_inputs)
            {
                for (int i = 0; i < m_param.varselnet_param.num_inputs; i++)
                {
                    LayerParameter p = new LayerParameter(LayerParameter.LayerType.GRN, m_param.name + ".grn" + i.ToString());
                    p.grn_param.axis = m_param.varselnet_param.axis;
                    p.grn_param.batch_first = m_param.varselnet_param.batch_first;
                    p.grn_param.bias_filler = m_param.varselnet_param.bias_filler;
                    p.grn_param.weight_filler = m_param.varselnet_param.weight_filler;
                    p.grn_param.input_dim = m_param.varselnet_param.input_dim;
                    p.grn_param.hidden_dim = m_param.varselnet_param.hidden_dim;
                    p.grn_param.output_dim = m_param.varselnet_param.hidden_dim;
                    p.grn_param.dropout_ratio = m_param.varselnet_param.dropout_ratio;
                    Layer<T> grn = Layer<T>.Create(m_cuda, m_log, convertLayerParam(p, m_param), null);

                    Blob<T> blobGrn = new Blob<T>(m_cuda, m_log);
                    blobGrn.ReshapeLike(m_blobGrn1);

                    m_rgSingleVarGrn.Add(grn);
                    m_colSingleVarGrn.Add(blobGrn);

                    addBtmTop(m_blobGrn1, m_colSingleVarGrn[i]);
                    m_rgSingleVarGrn[i].Setup(m_colBtm, m_colTop);
                    blobs.Add(grn.blobs);
                }
            }

            rgShape.Clear();
            rgShape.Add(colBottom[0].num);
            rgShape.Add(colBottom[0].channels / m_param.varselnet_param.num_inputs);
            rgShape.Add(m_param.varselnet_param.num_inputs);
            m_blobProcessedInputs.Reshape(rgShape);
            m_blobProcessedInputs1.Reshape(rgShape);
        }

        /// <summary>
        /// Reshape the top (output) blobs.
        /// </summary>
        public override void Reshape(BlobCollection<T> colBottom, BlobCollection<T> colTop)
        {
            List<int> rgShape;
            Blob<T> blobStaticSelection = null;

            if (colBottom.Count > 1)
                blobStaticSelection = colBottom[1];

            m_blobBtm.ReshapeLike(colBottom[0]);

            m_rgShape.Clear();
            m_rgShapeOringal.Clear();

            addBtmTop(colBottom[0], m_blobSparseWts);
            if (colBottom.Count > 1)
                m_colBtm.Add(blobStaticSelection);
            m_grnFlatten.Reshape(m_colBtm, m_colTop);

            addBtmTop(m_blobSparseWts, m_blobSparseWtsSmx);
            m_softmax.Reshape(m_colBtm, m_colTop);

            rgShape = Utility.Clone<int>(m_blobSparseWtsSmx.shape());
            rgShape.Add(1);
            rgShape.Add(1);
            m_blobSparseWtsSmx.Reshape(rgShape);

            addBtmTop(m_blobSparseWtsSmx, m_blobSparseWtsSmxT);
            m_transpose.Reshape(m_colBtm, m_colTop);

            rgShape.Clear();
            rgShape.Add(colBottom[0].num);
            rgShape.Add(colBottom[0].channels / m_param.varselnet_param.num_inputs);
            m_blobGrn1.Reshape(rgShape);

            for (int i = 0; i < m_param.varselnet_param.num_inputs; i++)
            {
                m_colSingleVarGrn[i].ReshapeLike(m_blobGrn1);

                addBtmTop(m_blobGrn1, m_colSingleVarGrn[i]);
                m_rgSingleVarGrn[i].Reshape(m_colBtm, m_colTop);
            }

            rgShape = Utility.Clone<int>(m_colSingleVarGrn[0].shape());
            rgShape.Add(m_param.varselnet_param.num_inputs);
            m_blobProcessedInputs.Reshape(rgShape);
            m_blobProcessedInputs1.Reshape(rgShape);

            colTop[0].ReshapeLike(m_colSingleVarGrn[0]);
            if (colTop.Count > 1)
            {
                colTop[1].ReshapeLike(m_blobSparseWts);
                colTop[1].type = BLOB_TYPE.WEIGHT;
            }
        }

        /// <summary>
        /// Forward computation.
        /// </summary>
        protected override void forward(BlobCollection<T> colBottom, BlobCollection<T> colTop)
        {
            m_blobBtm.CopyFrom(colBottom[0]);
            Blob<T> blobStaticSelection = null;

            if (colBottom.Count > 1)
                blobStaticSelection = colBottom[1];

            // Infer the variable selection weights by running the flattened embedding through a GRN. The flattened
            // embedding should have shape [(num_samples * num_temporal_steps) x (num_inputs x input_dim)] where
            // input_dim represents the model_dim or the state_dim. With static variable selection, num_temporal_steps
            // is set to 1.
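            // Illustrative sizes (assumed for this example, not taken from the code): with num_samples = 16,
            // num_temporal_steps = 30, num_inputs = 4 and input_dim = 64, the flattened embedding is [480 x 256]
            // and the selection weights produced below are [480 x 4].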
            addBtmTop(colBottom[0], m_blobSparseWts);
            if (colBottom.Count > 1)
                m_colBtm.Add(blobStaticSelection);
            m_grnFlatten.Forward(m_colBtm, m_colTop);

            // Sparse weights are of shape [(num_samples * num_temporal_steps) x num_inputs x 1]
            addBtmTop(m_blobSparseWts, m_blobSparseWtsSmx);
            m_softmax.Forward(m_colBtm, m_colTop);

            // Unsqueeze twice (add two singleton dimensions).
            List<int> rgShape = Utility.Clone<int>(m_blobSparseWtsSmx.shape());
            rgShape.Add(1);
            rgShape.Add(1);
            m_blobSparseWtsSmx.Reshape(rgShape);

            // Before weighting the variables, a GRN is applied to each transformed input.
            for (int i = 0; i < m_param.varselnet_param.num_inputs; i++)
            {
                // Copy the variable specific data to the GRN input.
                m_cuda.channel_copy(m_blobGrn1.count(), m_blobGrn1.num, 1, m_param.varselnet_param.num_inputs, m_blobGrn1.channels, i, colBottom[0].gpu_data, m_blobGrn1.mutable_gpu_data, DIR.FWD);

                // Each element in the resulting list is of size [(num_samples * num_temporal_steps) x state_size],
                // and each element corresponds to a single input variable.
                addBtmTop(m_blobGrn1, m_colSingleVarGrn[i]);
                m_rgSingleVarGrn[i].Forward(m_colBtm, m_colTop);

                // Combine the outputs of the single variable GRNs along an additional axis with
                // dimension [(num_samples * num_temporal_steps) x state_size x num_inputs]
                m_cuda.channel_copy(m_blobGrn1.count(), m_blobGrn1.num, m_blobGrn1.channels, m_param.varselnet_param.num_inputs, 1, i, m_blobProcessedInputs.mutable_gpu_data, m_colSingleVarGrn[i].gpu_data, DIR.BWD);
            }

            // Weight the processed inputs with the selection weights viewed as [(num_samples * num_temporal_steps) x 1 x num_inputs]
            // so that the weight given to each variable (for each time-step/observation) multiplies the entire state
            // vector representing the specific input variable on that time-step.
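            // In effect (assuming processed inputs of shape [N x state_size x num_inputs] and weights w of shape
            // [N x 1 x num_inputs]): processed1[n, s, i] = processed[n, s, i] * w[n, i] for every state element s,
            // so each variable's state vector is scaled by that variable's softmax weight.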
            addBtmTop(m_blobSparseWtsSmx, m_blobSparseWtsSmxT);
            m_transpose.Forward(m_colBtm, m_colTop);

            // Apply the transposed softmax weightings to the processed inputs.
            int nInnerNum = m_blobProcessedInputs.count(2);
            m_cuda.channel_mulv(m_blobProcessedInputs.count(), m_blobProcessedInputs.num, m_blobProcessedInputs.channels, nInnerNum, m_blobProcessedInputs.gpu_data, m_blobSparseWtsSmxT.gpu_data, m_blobProcessedInputs1.mutable_gpu_data);

            // Sum over the input variables to create a weighted-sum representation of width state_size for each
            // time-step, with dimension [(num_samples * num_temporal_steps) x state_size]
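            // That is, colTop[0][n, s] = sum over i of processed1[n, s, i], collapsing the num_inputs axis.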
            m_cuda.channel_sum(m_blobProcessedInputs1.count(), m_blobProcessedInputs1.num, m_blobProcessedInputs1.channels, nInnerNum, m_blobProcessedInputs1.gpu_data, colTop[0].mutable_gpu_data, false);
            if (colTop.Count > 1)
                colTop[1].CopyFrom(m_blobSparseWts);
        }

        private void copyShape(List<int> rg, Blob<T> b)
        {
            rg.Clear();

            for (int i = 0; i < b.shape().Count; i++)
            {
                rg.Add(b.shape(i));
            }
        }

        /// <summary>
        /// Computes the error gradient w.r.t. the stacked embedding numeric and categorical value inputs.
        /// </summary>
        protected override void backward(BlobCollection<T> colTop, List<bool> rgbPropagateDown, BlobCollection<T> colBottom)
        {
            // Expand the top(0) diff to each channel in the processed inputs.
            int nInnerNum = m_blobProcessedInputs.count(2);
            m_cuda.channel_fillfrom(m_blobProcessedInputs1.count(), m_blobProcessedInputs1.num, m_blobProcessedInputs1.channels, nInnerNum, colTop[0].gpu_diff, m_blobProcessedInputs1.mutable_gpu_diff, DIR.FWD);

            // Apply the transposed softmax weightings to the processed inputs.
            m_cuda.channel_mulv(m_blobProcessedInputs.count(), m_blobProcessedInputs.num, m_blobProcessedInputs.channels, nInnerNum, m_blobProcessedInputs1.gpu_diff, m_blobSparseWtsSmxT.gpu_data, m_blobProcessedInputs.mutable_gpu_diff);

            // Calculate the SparseWtsT gradient as
            // sparseWtsT.grad = ProcessedInput.dataT * colTop[0].diff
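            // Shapes for the MatMul below (per batch row, as reconstructed from the reshapes that follow):
            // processedInputsT is viewed as [num_inputs x state_size] and colTop[0].diff as [state_size x 1],
            // giving a [num_inputs x 1] gradient for the transposed selection weights.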
            copyShape(m_rgShapeOringal, m_blobProcessedInputs);
            copyShape(m_rgShape, m_blobProcessedInputs);
            m_rgShape.Insert(1, 1);
            m_blobProcessedInputs.Reshape(m_rgShape);
            m_blobProcessedInputsT.CopyFromAndTransposeHeightWidth(m_blobProcessedInputs);
            m_blobProcessedInputs.Reshape(m_rgShapeOringal);

            copyShape(m_rgShapeOringal, colTop[0]);
            copyShape(m_rgShape, colTop[0]);
            m_rgShape.Insert(1, 1);
            m_rgShape.Add(1);
            colTop[0].Reshape(m_rgShape);

            m_blobSparseWtsSmxT.MatMul(m_blobProcessedInputsT, colTop[0], true, false, false, 1, false, true, true);
            colTop[0].Reshape(m_rgShapeOringal);

            // Backpropagate through the GRN applied to each transformed input.
            for (int i = 0; i < m_param.varselnet_param.num_inputs; i++)
            {
                // Copy the variable specific data to the GRN input.
                m_cuda.channel_copy(m_blobGrn1.count(), m_blobGrn1.num, 1, m_param.varselnet_param.num_inputs, m_blobGrn1.channels, i, colBottom[0].gpu_data, m_blobGrn1.mutable_gpu_data, DIR.FWD);
                // Copy the variable specific gradient slice out of the processed inputs diff
                // (shape [(num_samples * num_temporal_steps) x state_size x num_inputs]).
                m_cuda.channel_copy(m_blobGrn1.count(), m_blobGrn1.num, m_blobGrn1.channels, m_param.varselnet_param.num_inputs, 1, i, m_blobProcessedInputs.mutable_gpu_diff, m_colSingleVarGrn[i].gpu_diff, DIR.FWD);

                // Each element in the resulting list is of size [(num_samples * num_temporal_steps) x state_size],
                // and each element corresponds to a single input variable.
                addBtmTop(m_blobGrn1, m_colSingleVarGrn[i]);
                m_rgSingleVarGrn[i].Backward(m_colTop, rgbPropagateDown, m_colBtm);

                // Copy the variable specific gradient back into the staging bottom blob.
                m_cuda.channel_copy(m_blobGrn1.count(), m_blobGrn1.num, 1, m_param.varselnet_param.num_inputs, m_blobGrn1.channels, i, m_blobBtm.gpu_diff, m_blobGrn1.mutable_gpu_diff, DIR.BWD);
            }

            // Backpropagate through the transpose that viewed the selection weights as
            // [(num_samples * num_temporal_steps) x 1 x num_inputs].
            addBtmTop(m_blobSparseWtsSmx, m_blobSparseWtsSmxT);
            m_transpose.Backward(m_colTop, rgbPropagateDown, m_colBtm);

            // Backpropagate through the softmax; the sparse weights are of shape
            // [(num_samples * num_temporal_steps) x num_inputs x 1].
            addBtmTop(m_blobSparseWts, m_blobSparseWtsSmx);
            m_softmax.Backward(m_colTop, rgbPropagateDown, m_colBtm);

            // Backpropagate through the GRN applied to the flattened embedding, which has shape
            // [(num_samples * num_temporal_steps) x (num_inputs x input_dim)] where input_dim represents the
            // model_dim or the state_dim. With static variable selection, num_temporal_steps is set to 1.
            addBtmTop(colBottom[0], m_blobSparseWts);
            if (colBottom.Count > 1)
                m_colBtm.Add(colBottom[1]);
            m_grnFlatten.Backward(m_colTop, rgbPropagateDown, m_colBtm);

            // Add the gradient accumulation from the individual variable GRNs.
            m_cuda.add(colBottom[0].count(), colBottom[0].gpu_diff, m_blobBtm.gpu_diff, colBottom[0].mutable_gpu_diff);
        }
    }
}
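The listing above only defines the layer. The short sketch below is illustrative and is not part of VarSelNetLayer.cs: it assumes an already-initialized CudaDnn<float> connection (cuda) and Log (log), and the parameter values and blob sizes (4 inputs of width 64, 256 rows) are arbitrary example values rather than values taken from the source.

// Configure a VARSELNET layer (values below are example assumptions).
LayerParameter p = new LayerParameter(LayerParameter.LayerType.VARSELNET, "vsn");
p.varselnet_param.num_inputs = 4;    // number of input variables to select among
p.varselnet_param.input_dim = 64;    // width of each variable's embedding (the state_size)
p.varselnet_param.hidden_dim = 64;   // hidden width of the internal GRNs
Layer<float> vsn = Layer<float>.Create(cuda, log, p, null);

// The bottom blob holds the flattened embedding:
// [(num_samples * num_temporal_steps) x (num_inputs * input_dim)].
Blob<float> blobFlat = new Blob<float>(cuda, log);
blobFlat.Reshape(new List<int>() { 256, 4 * 64 });
Blob<float> blobOut = new Blob<float>(cuda, log);

BlobCollection<float> colBtm = new BlobCollection<float>();
colBtm.Add(blobFlat);
BlobCollection<float> colTop = new BlobCollection<float>();
colTop.Add(blobOut);

vsn.Setup(colBtm, colTop);
vsn.Forward(colBtm, colTop);   // blobOut now holds the weighted sum of the per-variable GRN outputs, shape [256 x 64].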