MyCaffe 1.12.2.41
Deep learning software for Windows C# programmers.
MVNLayer.cs
using System;
using System.Collections.Generic;
using System.Linq;
using System.Text;
using MyCaffe.basecode;
using MyCaffe.common;
using MyCaffe.param;

namespace MyCaffe.layers
{
    /// <summary>
    /// The "Mean-Variance Normalization" MVNLayer normalizes the input to have 0-mean and/or unit (1) variance.
    /// </summary>
    public class MVNLayer<T> : Layer<T>
    {
        Blob<T> m_blobMean;
        Blob<T> m_blobVariance;
        Blob<T> m_blobTemp;
        // The sum multiplier is used to carry out the sum using BLAS.
        Blob<T> m_blobSumMultiplier;
        double m_dfEps;

        /// <summary>
        /// The MVNLayer constructor.
        /// </summary>
        /// <param name="cuda">Specifies the CudaDnn connection to Cuda.</param>
        /// <param name="log">Specifies the Log for output.</param>
        /// <param name="p">Specifies the LayerParameter.</param>
        public MVNLayer(CudaDnn<T> cuda, Log log, LayerParameter p)
            : base(cuda, log, p)
        {
            m_type = LayerParameter.LayerType.MVN;
            m_blobMean = new Blob<T>(cuda, log);
            m_blobMean.Name = m_param.name + " mean";
            m_blobVariance = new Blob<T>(cuda, log);
            m_blobVariance.Name = m_param.name + " variance";
            m_blobTemp = new Blob<T>(cuda, log);
            m_blobTemp.Name = m_param.name + " temp";
            m_blobSumMultiplier = new Blob<T>(cuda, log);
            m_blobSumMultiplier.Name = m_param.name + " summult";
        }

        /// <summary>
        /// Releases all GPU and host resources used by the Layer.
        /// </summary>
        protected override void dispose()
        {
            if (m_blobMean != null)
            {
                m_blobMean.Dispose();
                m_blobMean = null;
            }

            if (m_blobVariance != null)
            {
                m_blobVariance.Dispose();
                m_blobVariance = null;
            }

            if (m_blobTemp != null)
            {
                m_blobTemp.Dispose();
                m_blobTemp = null;
            }

            if (m_blobSumMultiplier != null)
            {
                m_blobSumMultiplier.Dispose();
                m_blobSumMultiplier = null;
            }

            base.dispose();
        }

        /// <summary>
        /// Derivative layers should add all internal blobs to the 'col' provided.
        /// </summary>
        protected override void setup_internal_blobs(BlobCollection<T> col)
        {
            if (col.Count > 0)
                return;

            col.Add(m_blobMean);
            col.Add(m_blobVariance);
            col.Add(m_blobTemp);
            col.Add(m_blobSumMultiplier);
        }

        /// <summary>
        /// Returns the exact number of required bottom (input) Blobs: input.
        /// </summary>
        public override int ExactNumBottomBlobs
        {
            get { return 1; }
        }

        /// <summary>
        /// Returns the exact number of required top (output) Blobs: mvn.
        /// </summary>
        public override int ExactNumTopBlobs
        {
            get { return 1; }
        }

        /// <summary>
        /// Setup the layer.
        /// </summary>
        /// <param name="colBottom">Specifies the collection of bottom (input) Blobs.</param>
        /// <param name="colTop">Specifies the collection of top (output) Blobs.</param>
        public override void LayerSetUp(BlobCollection<T> colBottom, BlobCollection<T> colTop)
        {
        }

        /// <summary>
        /// Reshape the bottom (input) and top (output) blobs.
        /// </summary>
        /// <param name="colBottom">Specifies the collection of bottom (input) Blobs.</param>
        /// <param name="colTop">Specifies the collection of top (output) Blobs.</param>
        public override void Reshape(BlobCollection<T> colBottom, BlobCollection<T> colTop)
        {
            colTop[0].ReshapeLike(colBottom[0]);

            m_blobMean.Reshape(colBottom[0].num, colBottom[0].channels, 1, 1);
            m_blobVariance.Reshape(colBottom[0].num, colBottom[0].channels, 1, 1);
            m_blobTemp.Reshape(colBottom[0].num, colBottom[0].channels, colBottom[0].height, colBottom[0].width);

            if (m_param.mvn_param.across_channels)
                m_blobSumMultiplier.Reshape(1, colBottom[0].channels, colBottom[0].height, colBottom[0].width);
            else
                m_blobSumMultiplier.Reshape(1, 1, colBottom[0].height, colBottom[0].width);

            m_blobSumMultiplier.SetData(1.0);
            m_dfEps = m_param.mvn_param.eps;
        }

        /// <summary>
        /// The forward computation that computes the normalization.
        /// </summary>
        /// <param name="colBottom">Specifies the collection of bottom (input) Blobs.</param>
        /// <param name="colTop">Specifies the collection of top (output) Blobs.</param>
        protected override void forward(BlobCollection<T> colBottom, BlobCollection<T> colTop)
        {
            long hBottomData = colBottom[0].gpu_data;
            long hTopData = colTop[0].mutable_gpu_data;
            int nNum = colBottom[0].num;

            if (!m_param.mvn_param.across_channels)
                nNum *= colBottom[0].channels;

            int nDim = colBottom[0].count() / nNum;

            // Subtract the mean: gemv with the all-ones sum multiplier computes the per-row mean EX,
            // and gemm broadcasts -EX back across each row as a rank-1 outer product.
            m_cuda.gemv(false, nNum, nDim, 1.0 / nDim, hBottomData, m_blobSumMultiplier.gpu_data, 0.0, m_blobMean.mutable_gpu_data); // EX
            m_cuda.gemm(false, false, nNum, nDim, 1, -1.0, m_blobMean.gpu_data, m_blobSumMultiplier.gpu_data, 0.0, m_blobTemp.mutable_gpu_data);
            m_cuda.add(m_blobTemp.count(), hBottomData, m_blobTemp.gpu_data, hTopData); // X-EX

            if (m_param.mvn_param.normalize_variance)
            {
                // Compute the variance using var(X) = E((X-EX)^2).
                m_cuda.powx(colBottom[0].count(), hTopData, 2.0, m_blobTemp.mutable_gpu_data); // (X-EX)^2
                m_cuda.gemv(false, nNum, nDim, 1.0 / nDim, m_blobTemp.gpu_data, m_blobSumMultiplier.gpu_data, 0.0, m_blobVariance.mutable_gpu_data); // E((X-EX)^2)

                // Normalize the variance: divide each row by sqrt(var(X)) + eps.
                m_cuda.powx(m_blobVariance.count(), m_blobVariance.gpu_data, 0.5, m_blobVariance.mutable_gpu_data);
                m_cuda.add_scalar(m_blobVariance.count(), m_dfEps, m_blobVariance.mutable_gpu_data);
                m_cuda.gemm(false, false, nNum, nDim, 1, 1.0, m_blobVariance.gpu_data, m_blobSumMultiplier.gpu_data, 0.0, m_blobTemp.mutable_gpu_data);
                m_cuda.div(m_blobTemp.count(), hTopData, m_blobTemp.gpu_data, hTopData);
            }
        }

        /// <summary>
        /// Computes the mvn error gradient w.r.t. the output.
        /// </summary>
        /// <param name="colTop">Specifies the collection of top (output) Blobs.</param>
        /// <param name="rgbPropagateDown">Specifies whether or not to propagate down to each bottom Blob.</param>
        /// <param name="colBottom">Specifies the collection of bottom (input) Blobs.</param>
        protected override void backward(BlobCollection<T> colTop, List<bool> rgbPropagateDown, BlobCollection<T> colBottom)
        {
            if (!rgbPropagateDown[0])
                return;

            long hTopDiff = colTop[0].gpu_diff;
            long hTopData = colTop[0].gpu_data;
            long hBottomData = colBottom[0].gpu_data;
            long hBottomDiff = colBottom[0].mutable_gpu_diff;
            int nNum = colBottom[0].num;

            if (!m_param.mvn_param.across_channels)
                nNum *= colBottom[0].channels;

            int nDim = colBottom[0].count() / nNum;

            if (m_param.mvn_param.normalize_variance)
            {
                // dE/dX = (dE/dY - mean(dE/dY) - mean(dE/dY .* Y) .* Y) ./ (sqrt(var(X)) + eps)
                m_cuda.mul(m_blobTemp.count(), hTopData, hTopDiff, hBottomDiff);
                m_cuda.gemv(false, nNum, nDim, 1.0, hBottomDiff, m_blobSumMultiplier.gpu_data, 0.0, m_blobMean.mutable_gpu_data);
                m_cuda.gemm(false, false, nNum, nDim, 1, 1.0, m_blobMean.gpu_data, m_blobSumMultiplier.gpu_data, 0.0, hBottomDiff);
                m_cuda.mul(m_blobTemp.count(), hTopData, hBottomDiff, hBottomDiff);

                m_cuda.gemv(false, nNum, nDim, 1.0, hTopDiff, m_blobSumMultiplier.gpu_data, 0.0, m_blobMean.mutable_gpu_data);
                m_cuda.gemm(false, false, nNum, nDim, 1, 1.0, m_blobMean.gpu_data, m_blobSumMultiplier.gpu_data, 1.0, hBottomDiff);

                m_cuda.axpby(m_blobTemp.count(), 1.0, hTopDiff, -1.0 / nDim, hBottomDiff);

                // Put the squares of bottom into temp (note: this result is immediately overwritten
                // by the broadcast below, matching the original C++ Caffe implementation).
                m_cuda.powx(m_blobTemp.count(), hBottomData, 2.0, m_blobTemp.mutable_gpu_data);
                // Broadcast the (sqrt(var(X)) + eps) values saved during the forward pass across
                // each row, then divide to complete the gradient.
                m_cuda.gemm(false, false, nNum, nDim, 1, 1.0, m_blobVariance.gpu_data, m_blobSumMultiplier.gpu_data, 0.0, m_blobTemp.mutable_gpu_data);
                m_cuda.div(m_blobTemp.count(), hBottomDiff, m_blobTemp.gpu_data, hBottomDiff);
            }
            else
            {
                // Without variance normalization, the gradient is simply the mean-subtracted top diff.
                m_cuda.gemv(false, nNum, nDim, 1.0 / nDim, hTopDiff, m_blobSumMultiplier.gpu_data, 0.0, m_blobMean.mutable_gpu_data);
                m_cuda.gemm(false, false, nNum, nDim, 1, -1.0, m_blobMean.gpu_data, m_blobSumMultiplier.gpu_data, 0.0, m_blobTemp.mutable_gpu_data);
                m_cuda.add(m_blobTemp.count(), hTopDiff, m_blobTemp.gpu_data, hBottomDiff);
            }
        }
    }
}
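
The GPU calls above are BLAS choreography for a simple per-row computation: each of the nNum rows of nDim values is shifted to zero mean and, when normalize_variance is set, divided by sqrt(var(X)) + eps (note the layer adds eps after the square root, not under it). The stand-alone CPU sketch below is an illustration written for this page, not part of MyCaffe; the MvnReference class, its Forward/Backward methods, and the rgDenom parameter are hypothetical names. It can serve as an obvious reference when checking the gemv/gemm sequences above.

using System;

// A minimal CPU reference for the MVN math above (illustrative only, not part of MyCaffe).
public static class MvnReference
{
    // Forward: Y = (X - E[X]) / denom per row, where denom = sqrt(var(X)) + eps when the
    // variance is normalized, and 1 otherwise. The per-row denominators are returned in
    // rgDenom so the backward sketch can reuse them, as the layer reuses m_blobVariance.
    public static double[] Forward(double[] rgX, int nNum, int nDim, bool bNormalizeVariance, double dfEps, out double[] rgDenom)
    {
        double[] rgY = new double[rgX.Length];
        rgDenom = new double[nNum];

        for (int n = 0; n < nNum; n++)
        {
            // E[X] over the row - the gemv with the all-ones sum multiplier in the layer.
            double dfMean = 0;
            for (int i = 0; i < nDim; i++)
                dfMean += rgX[n * nDim + i];
            dfMean /= nDim;

            // var(X) = E((X-EX)^2), as in the layer's powx/gemv pair.
            double dfVar = 0;
            for (int i = 0; i < nDim; i++)
            {
                double dfDiff = rgX[n * nDim + i] - dfMean;
                dfVar += dfDiff * dfDiff;
            }
            dfVar /= nDim;

            // Note: eps is added after the square root, matching the layer.
            rgDenom[n] = bNormalizeVariance ? Math.Sqrt(dfVar) + dfEps : 1.0;

            for (int i = 0; i < nDim; i++)
                rgY[n * nDim + i] = (rgX[n * nDim + i] - dfMean) / rgDenom[n];
        }

        return rgY;
    }

    // Backward (normalize_variance case), mirroring the gemv/gemm sequence in the layer:
    // dE/dX = (dE/dY - mean(dE/dY) - mean(dE/dY .* Y) .* Y) / (sqrt(var(X)) + eps)
    public static double[] Backward(double[] rgTopDiff, double[] rgY, double[] rgDenom, int nNum, int nDim)
    {
        double[] rgBottomDiff = new double[rgTopDiff.Length];

        for (int n = 0; n < nNum; n++)
        {
            double dfMeanDy = 0;  // mean(dE/dY)
            double dfMeanDyY = 0; // mean(dE/dY .* Y)

            for (int i = 0; i < nDim; i++)
            {
                dfMeanDy += rgTopDiff[n * nDim + i];
                dfMeanDyY += rgTopDiff[n * nDim + i] * rgY[n * nDim + i];
            }
            dfMeanDy /= nDim;
            dfMeanDyY /= nDim;

            for (int i = 0; i < nDim; i++)
                rgBottomDiff[n * nDim + i] = (rgTopDiff[n * nDim + i] - dfMeanDy - dfMeanDyY * rgY[n * nDim + i]) / rgDenom[n];
        }

        return rgBottomDiff;
    }
}

For an input blob of shape (N, C, H, W), the layer uses nNum = N*C and nDim = H*W when across_channels is false, or nNum = N and nDim = C*H*W when it is true, which is exactly the nNum *= channels adjustment in forward and backward.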