mycaffe/html/_softmax_cross_entropy2_loss_layer_8cs_source.html

using System;

using System.Collections.Generic;

using System.Linq;

using System.Text;

using MyCaffe.basecode;

using MyCaffe.common;

using MyCaffe.param;


namespace MyCaffe.layers

{

    public class SoftmaxCrossEntropy2LossLayer<T> : LossLayer<T>

    {

        Layer<T> m_softmaxLayer;

        Layer<T> m_logLayer;

        Blob<T> m_blobProb;

        Blob<T> m_blobLogProb;

        Blob<T> m_blobLoss;

        BlobCollection<T> m_colSoftmaxBottomVec = new BlobCollection<T>();

        BlobCollection<T> m_colSoftmaxTopVec = new BlobCollection<T>();

        BlobCollection<T> m_colLogBottomVec = new BlobCollection<T>();

        BlobCollection<T> m_colLogTopVec = new BlobCollection<T>();


        // How to normalize the loss.

        int? m_nIgnoreLabel = null;

        double m_dfNormalizer = 0;

        int m_nSoftmaxAxis = 1;


        public SoftmaxCrossEntropy2LossLayer(CudaDnn<T> cuda, Log log, LayerParameter p)

            : base(cuda, log, p)

        {

            m_type = LayerParameter.LayerType.SOFTMAXCROSSENTROPY2_LOSS;

            m_blobProb = new Blob<T>(cuda, log);

            m_blobProb.Name = m_param.name + " prob";

            m_blobLogProb = new Blob<T>(cuda, log);

            m_blobLogProb.Name = m_param.name + " logprob";

            m_blobLoss = new Blob<T>(cuda, log);

            m_blobLoss.Name = m_param.name + " loss";

        }


        protected override void dispose()

        {

            m_blobProb.Dispose();


            if (m_softmaxLayer != null)

                m_softmaxLayer.Dispose();


            base.dispose();

        }


        protected override void setup_internal_blobs(BlobCollection<T> col)

        {

            if (col.Count > 0)

                return;


            col.Add(m_blobProb);

        }


        public override int ExactNumTopBlobs

        {

            get { return -1; }

        }


        public override int MinTopBlobs

        {

            get { return 1; }

        }


        public override int MaxTopBlobs

        {

            get { return 2; }

        }


        public override void LayerSetUp(BlobCollection<T> colBottom, BlobCollection<T> colTop)

        {

            base.LayerSetUp(colBottom, colTop);


            m_nIgnoreLabel = m_param.loss_param.ignore_label;


            LayerParameter param_softmax = m_param.Clone(false);

            param_softmax.SetType(LayerParameter.LayerType.SOFTMAX);

            param_softmax.softmax_param = m_param.softmax_param.Clone() as SoftmaxParameter;

            param_softmax.loss_weight.Clear();


            m_softmaxLayer = Layer<T>.Create(m_cuda, m_log, param_softmax, null);

            m_colSoftmaxBottomVec = new BlobCollection<T>() { colBottom[0] };

            m_colSoftmaxTopVec = new BlobCollection<T>() { m_blobProb };


            m_softmaxLayer.Setup(m_colSoftmaxBottomVec, m_colSoftmaxTopVec);


            LayerParameter param_log = new LayerParameter(LayerParameter.LayerType.LOG);


            m_logLayer = Layer<T>.Create(m_cuda, m_log, param_log, null);

            m_colLogBottomVec = new BlobCollection<T>() { m_blobProb };

            m_colLogTopVec = new BlobCollection<T>() { m_blobLogProb };


            m_logLayer.Setup(m_colLogBottomVec, m_colLogTopVec);

        }


        public override void Reshape(BlobCollection<T> colBottom, BlobCollection<T> colTop)

        {

            base.Reshape(colBottom, colTop);


            m_blobLoss.ReshapeLike(colBottom[0]);


            m_softmaxLayer.Reshape(m_colSoftmaxBottomVec, m_colSoftmaxTopVec);

            m_logLayer.Reshape(m_colLogBottomVec, m_colLogTopVec);


            m_nSoftmaxAxis = colBottom[0].CanonicalAxisIndex(m_param.softmax_param.axis);

            m_nOuterNum = colBottom[0].count(0, m_nSoftmaxAxis);

            m_nInnerNum = colBottom[0].count(m_nSoftmaxAxis + 1);


            if (!m_bIgnoreLabels)

            {

                m_log.CHECK_EQ(colBottom[0].count(0, m_nSoftmaxAxis), colBottom[1].count(0, m_nSoftmaxAxis), "Number of labels must match number of predictions; e.g., if softmax axis == 1 and prediction shape is (N, C, H, W), label count (number of labels) must be N*H*W, with integer values in {0, 1, ..., C-1}.");


                if (colTop.Count >= 2)

                {

                    // softmax output

                    colTop[1].ReshapeLike(colBottom[0]);

                }

            }

        }


        protected override void forward(BlobCollection<T> colBottom, BlobCollection<T> colTop)

        {

            // The forward pass computes the sotmax outputs (which are probabilities).

            m_softmaxLayer.Forward(m_colSoftmaxBottomVec, m_colSoftmaxTopVec);


            // Run the log on the Probabilities to get LogSoftmax

            m_logLayer.Forward(m_colLogBottomVec, m_colLogTopVec);


            // Use the softmax output for input data.

            long hProbData = m_blobLogProb.gpu_data;

            long hTarget = colBottom[1].gpu_data;

            int nInputCount = m_blobProb.count();

            int nDim = m_blobProb.shape()[m_nSoftmaxAxis];

            int nCount = m_nOuterNum * m_nInnerNum;


            m_blobLoss.SetDiff(0.0);

            long hLossData = m_blobLoss.mutable_gpu_data;

            long hLossDiff = m_blobLoss.mutable_gpu_diff;


            // Since this memory is not used for anything, we use it here to avoid having

            // to allocate the GPU memory to accumulate intermediate results.

            colBottom[1].SetDiff(0);

            long hCountData = colBottom[1].mutable_gpu_diff;


            // Run the NLL Loss portion to get the loss.

            m_cuda.softmax_cross_entropy_fwd(colBottom[0].count(), hProbData, hTarget, hLossDiff, hLossData, m_nOuterNum, nDim, m_nInnerNum, hCountData, m_nIgnoreLabel.GetValueOrDefault(-1));

            double dfLoss = m_cuda.asum_double(colBottom[0].count(), hLossData);


            double dfValidCount = nCount;

            // Only launch another CUDA kernel if we actually need the valid count.

            if (m_normalization == LossParameter.NormalizationMode.VALID && m_nIgnoreLabel.HasValue)

                dfValidCount = m_cuda.asum_double(nCount, hCountData);


            m_dfNormalizer = get_normalizer(m_normalization, (int)dfValidCount);

            double dfFinalLoss = dfLoss / m_dfNormalizer;


            colTop[0].SetData(dfFinalLoss, 0);


            // Return the losses in colTop[1] if it exists.

            if (colTop.Count == 2)

                colTop[1].CopyFrom(m_blobLoss);


            // Clear scratch memory to prevent interfering with the backward pass (see #6202)

            colBottom[1].SetDiff(0);

        }


        protected override void backward(BlobCollection<T> colTop, List<bool> rgbPropagateDown, BlobCollection<T> colBottom)

        {

            if (!rgbPropagateDown[0])

                return;


            // Calculate the NLL Loss Gradient

            float fGrad = convertF(colTop[0].GetDiff(0));

            fGrad = -1.0f * fGrad / (float)m_dfNormalizer;


            m_blobLoss.scale_diff(fGrad);


            // Calculate the log gradient.

            m_blobLogProb.CopyFrom(m_blobLoss, true);

            m_logLayer.Backward(m_colLogTopVec, rgbPropagateDown, m_colLogBottomVec);


            // Calculate the Softmax gradient.

            m_softmaxLayer.Backward(m_colSoftmaxTopVec, rgbPropagateDown, m_colSoftmaxBottomVec);

        }

    }

}

MyCaffe.basecode.Log
The Log class provides general output in text form.
Definition: Log.cs:13

MyCaffe.basecode.Log.CHECK_EQ
void CHECK_EQ(double df1, double df2, string str)
Test whether one number is equal to another.
Definition: Log.cs:239

MyCaffe.common.BlobCollection
The BlobCollection contains a list of Blobs.
Definition: BlobCollection.cs:16

MyCaffe.common.BlobCollection.Add
void Add(Blob< T > b)
Add a new Blob to the collection.
Definition: BlobCollection.cs:92

MyCaffe.common.BlobCollection.SetData
void SetData(double df)
Set all blob data to the value specified.
Definition: BlobCollection.cs:323

MyCaffe.common.BlobCollection.SetDiff
void SetDiff(double df)
Set all blob diff to the value specified.
Definition: BlobCollection.cs:311

MyCaffe.common.BlobCollection.Count
int Count
Returns the number of items in the collection.
Definition: BlobCollection.cs:30

MyCaffe.common.BlobCollection.ReshapeLike
void ReshapeLike(BlobCollection< T > src)
Reshapes all blobs in the collection to the sizes of the source.
Definition: BlobCollection.cs:214

MyCaffe.common.BlobCollection.CopyFrom
void CopyFrom(BlobCollection< T > bSrc, bool bCopyDiff=false)
Copy the data or diff from another BlobCollection into this one.
Definition: BlobCollection.cs:266

MyCaffe.common.Blob
The Blob is the main holder of data that moves through the Layers of the Net.
Definition: Blob.cs:25

MyCaffe.common.Blob.mutable_gpu_diff
long mutable_gpu_diff
Returns the diff GPU handle used by the CudaDnn connection.
Definition: Blob.cs:1555

MyCaffe.common.Blob.mutable_gpu_data
long mutable_gpu_data
Returns the data GPU handle used by the CudaDnn connection.
Definition: Blob.cs:1487

MyCaffe.common.Blob.CopyFrom
void CopyFrom(Blob< T > src, int nSrcOffset, int nDstOffset, int nCount, bool bCopyData, bool bCopyDiff)
Copy from a source Blob.
Definition: Blob.cs:903

MyCaffe.common.Blob.shape
List< int > shape()
Returns an array where each element contains the shape of an axis of the Blob.
Definition: Blob.cs:684

MyCaffe.common.Blob.count
int count()
Returns the total number of items in the Blob.
Definition: Blob.cs:739

MyCaffe.common.Blob.ReshapeLike
void ReshapeLike(Blob< T > b, bool? bUseHalfSize=null)
Reshape this Blob to have the same shape as another Blob.
Definition: Blob.cs:648

MyCaffe.common.Blob.Name
string Name
Get/set the name of the Blob.
Definition: Blob.cs:2184

MyCaffe.common.Blob.Dispose
virtual void Dispose(bool bDisposing)
Releases all resources used by the Blob (including both GPU and Host).
Definition: Blob.cs:402

MyCaffe.common.Blob.scale_diff
void scale_diff(double df)
Scale the diff by a scaling factor.
Definition: Blob.cs:1763

MyCaffe.common.Blob.SetDiff
void SetDiff(double dfVal, int nIdx=-1)
Either sets all of the diff items in the Blob to a given value, or alternatively only sets a single i...
Definition: Blob.cs:1981

MyCaffe.common.Blob.gpu_data
long gpu_data
Returns the data GPU handle used by the CudaDnn connection.
Definition: Blob.cs:1479

MyCaffe.common.CudaDnn
The CudaDnn object is the main interface to the Low-Level Cuda C++ DLL.
Definition: CudaDnn.cs:969

MyCaffe.layers.Layer
An interface for the units of computation which can be composed into a Net.
Definition: Layer.cs:31

MyCaffe.layers.Layer.m_log
Log m_log
Specifies the Log for output.
Definition: Layer.cs:43

MyCaffe.layers.Layer.m_param
LayerParameter m_param
Specifies the LayerParameter describing the Layer.
Definition: Layer.cs:47

MyCaffe.layers.Layer.Backward
void Backward(BlobCollection< T > colTop, List< bool > rgbPropagateDown, BlobCollection< T > colBottom)
Given the top Blob error gradients, compute the bottom Blob error gradients.
Definition: Layer.cs:815

MyCaffe.layers.Layer.Forward
double Forward(BlobCollection< T > colBottom, BlobCollection< T > colTop)
Given the bottom (input) Blobs, this function computes the top (output) Blobs and the loss.
Definition: Layer.cs:728

MyCaffe.layers.Layer.convertF
float convertF(T df)
Converts a generic to a float value.
Definition: Layer.cs:1359

MyCaffe.layers.Layer.Reshape
abstract void Reshape(BlobCollection< T > colBottom, BlobCollection< T > colTop)
Adjust the shapes of top blobs and internal buffers to accomodate the shapes of the bottom blobs.

MyCaffe.layers.Layer.m_cuda
CudaDnn< T > m_cuda
Specifies the CudaDnn connection to Cuda.
Definition: Layer.cs:39

MyCaffe.layers.Layer.Setup
void Setup(BlobCollection< T > colBottom, BlobCollection< T > colTop)
Implements common Layer setup functionality.
Definition: Layer.cs:439

MyCaffe.layers.Layer.Create
static Layer< T > Create(CudaDnn< T > cuda, Log log, LayerParameter p, CancelEvent evtCancel, IXDatabaseBase db=null, TransferInput trxinput=null)
Create a new Layer based on the LayerParameter.
Definition: Layer.cs:1468

MyCaffe.layers.Layer.m_type
LayerParameter.LayerType m_type
Specifies the Layer type.
Definition: Layer.cs:35

MyCaffe.layers.LossLayer
The LossLayer provides an interface for Layer's that take two blobs as input – usually (1) prediction...
Definition: LossLayer.cs:23

MyCaffe.layers.LossLayer.m_bIgnoreLabels
bool m_bIgnoreLabels
Set to true when labels are to be ignored.
Definition: LossLayer.cs:31

MyCaffe.layers.LossLayer.m_nOuterNum
int m_nOuterNum
Specifies the outer num, such as the batch count (e.g. count(0, axis)). Each derivative class must se...
Definition: LossLayer.cs:39

MyCaffe.layers.LossLayer.m_nInnerNum
int m_nInnerNum
Specifies the inner num, such as the channel + height + width (e.g. count(axis + 1))....
Definition: LossLayer.cs:43

MyCaffe.layers.LossLayer.get_normalizer
virtual double get_normalizer(LossParameter.NormalizationMode normalization_mode, int nValidCount)
Returns the normalizer used to normalize the loss.
Definition: LossLayer.cs:92

MyCaffe.layers.LossLayer.m_normalization
LossParameter.NormalizationMode m_normalization
Specifies the normalization mode used to normalize the loss.
Definition: LossLayer.cs:35

MyCaffe.layers.SoftmaxCrossEntropy2LossLayer
The SoftmaxCrossEntropy2Layer computes the cross-entropy (logisitic) loss and is often used for predi...
Definition: SoftmaxCrossEntropy2LossLayer.cs:17

MyCaffe.layers.SoftmaxCrossEntropy2LossLayer.SoftmaxCrossEntropy2LossLayer
SoftmaxCrossEntropy2LossLayer(CudaDnn< T > cuda, Log log, LayerParameter p)
The SoftmaxCrossEntropyLayer constructor.
Definition: SoftmaxCrossEntropy2LossLayer.cs:40

MyCaffe.layers.SoftmaxCrossEntropy2LossLayer.backward
override void backward(BlobCollection< T > colTop, List< bool > rgbPropagateDown, BlobCollection< T > colBottom)
Computes the softmax cross entropy loss error gradient w.r.t the predictions.
Definition: SoftmaxCrossEntropy2LossLayer.cs:251

MyCaffe.layers.SoftmaxCrossEntropy2LossLayer.MaxTopBlobs
override int MaxTopBlobs
Returns the maximum number of required top (output) Blobs: loss, loss values
Definition: SoftmaxCrossEntropy2LossLayer.cs:92

MyCaffe.layers.SoftmaxCrossEntropy2LossLayer.LayerSetUp
override void LayerSetUp(BlobCollection< T > colBottom, BlobCollection< T > colTop)
Setup the layer.
Definition: SoftmaxCrossEntropy2LossLayer.cs:101

MyCaffe.layers.SoftmaxCrossEntropy2LossLayer.MinTopBlobs
override int MinTopBlobs
Returns the minimum number of required top (output) Blobs: loss.
Definition: SoftmaxCrossEntropy2LossLayer.cs:84

MyCaffe.layers.SoftmaxCrossEntropy2LossLayer.ExactNumTopBlobs
override int ExactNumTopBlobs
Returns the exact number of required top (output) Blobs as variable.
Definition: SoftmaxCrossEntropy2LossLayer.cs:76

MyCaffe.layers.SoftmaxCrossEntropy2LossLayer.setup_internal_blobs
override void setup_internal_blobs(BlobCollection< T > col)
Derivative layers should add all internal blobws to the 'col' provided.
Definition: SoftmaxCrossEntropy2LossLayer.cs:64

MyCaffe.layers.SoftmaxCrossEntropy2LossLayer.Reshape
override void Reshape(BlobCollection< T > colBottom, BlobCollection< T > colTop)
Reshape the bottom (input) and top (output) blobs.
Definition: SoftmaxCrossEntropy2LossLayer.cs:132

MyCaffe.layers.SoftmaxCrossEntropy2LossLayer.forward
override void forward(BlobCollection< T > colBottom, BlobCollection< T > colTop)
The forward computation for softmax cross entropy loss.
Definition: SoftmaxCrossEntropy2LossLayer.cs:175

MyCaffe.layers.SoftmaxCrossEntropy2LossLayer.dispose
override void dispose()
Releases all GPU and host resources used by the Layer.
Definition: SoftmaxCrossEntropy2LossLayer.cs:53

MyCaffe.param.LayerParameter
Specifies the base parameter for all layers.
Definition: LayerParameter.cs:24

MyCaffe.param.LayerParameter.name
string name
Specifies the name of this LayerParameter.
Definition: LayerParameter.cs:1865

MyCaffe.param.LayerParameter.loss_weight
List< double > loss_weight
Specifies the loss weight.
Definition: LayerParameter.cs:1955

MyCaffe.param.LayerParameter.softmax_param
SoftmaxParameter softmax_param
Returns the parameter set when initialized with LayerType.SOFTMAX
Definition: LayerParameter.cs:2794

MyCaffe.param.LayerParameter.SetType
void SetType(LayerType type, bool bNewParam=true)
Set the layer type.
Definition: LayerParameter.cs:1900

MyCaffe.param.LayerParameter.LayerType
LayerType
Specifies the layer type.
Definition: LayerParameter.cs:110

MyCaffe.param.LayerParameter.loss_param
LossParameter loss_param
Returns the parameter set when initialized with LayerType.LOSS
Definition: LayerParameter.cs:2027

MyCaffe.param.LayerParameter.Clone
virtual LayerParameter Clone(bool bCloneBlobs)
Creates a new copy of this instance of the parameter.
Definition: LayerParameter.cs:3043

MyCaffe.param.LossParameter
Stores the parameters used by loss layers.
Definition: LossParameter.cs:16

MyCaffe.param.LossParameter.NormalizationMode
NormalizationMode
How to normalize the loss for loss layers that aggregate across batches, spatial dimensions,...
Definition: LossParameter.cs:27

MyCaffe.param.LossParameter.ignore_label
int? ignore_label
If specified, the ignore instances with the given label.
Definition: LossParameter.cs:71

MyCaffe.param.SoftmaxParameter
Specifies the parameters for the SoftmaxLayer
Definition: SoftmaxParameter.cs:23

MyCaffe.param.SoftmaxParameter.Clone
override LayerParameterBase Clone()
Creates a new copy of this instance of the parameter.
Definition: SoftmaxParameter.cs:115

MyCaffe.param.SoftmaxParameter.axis
int axis
The axis along which to perform the softmax – may be negative to index from the end (e....
Definition: SoftmaxParameter.cs:83

MyCaffe.basecode
The MyCaffe.basecode contains all generic types used throughout MyCaffe.
Definition: Annotation.cs:12

MyCaffe.common
The MyCaffe.common namespace contains common MyCaffe classes.
Definition: BatchInput.cs:8

MyCaffe.layers
The MyCaffe.layers namespace contains all layers that have a solidified code base,...
Definition: LayerFactory.cs:15

MyCaffe.param
The MyCaffe.param namespace contains parameters used to create models.
Definition: AttentionParameter.cs:9

MyCaffe
The MyCaffe namespace contains the main body of MyCaffe code that closesly tracks the C++ Caffe open-...
Definition: Annotation.cs:12

System
Definition: Component.cs:11