MyCaffe  1.12.2.41
Deep learning software for Windows C# programmers.
SoftmaxLossLayer.cs
using System;
using System.Collections.Generic;
using System.Linq;
using System.Text;
using MyCaffe.basecode;
using MyCaffe.common;
using MyCaffe.param;

namespace MyCaffe.layers
{
    public class SoftmaxLossLayer<T> : LossLayer<T>
    {
        Layer<T> m_softmaxLayer;
        Blob<T> m_blobProb;
        BlobCollection<T> m_colSoftmaxBottom;
        BlobCollection<T> m_colSoftmaxTop;
        int? m_nIgnoreLabel = null;
        int m_nSoftmaxAxis;

        public SoftmaxLossLayer(CudaDnn<T> cuda, Log log, LayerParameter p)
            : base(cuda, log, p)
        {
            m_type = LayerParameter.LayerType.SOFTMAXWITH_LOSS;
            m_blobProb = new Blob<T>(cuda, log);
            m_blobProb.Name = m_param.name + " prob";
        }

        protected override void dispose()
        {
            m_blobProb.Dispose();

            if (m_softmaxLayer != null)
                m_softmaxLayer.Dispose();

            base.dispose();
        }

        protected override void setup_internal_blobs(BlobCollection<T> col)
        {
            if (col.Count > 0)
                return;

            col.Add(m_blobProb);
        }

        public override int ExactNumTopBlobs
        {
            get { return -1; }
        }

        public override int MinTopBlobs
        {
            get { return 1; }
        }

        public override int MaxTopBlobs
        {
            get { return 2; }
        }

        public override void LayerSetUp(BlobCollection<T> colBottom, BlobCollection<T> colTop)
        {
            base.LayerSetUp(colBottom, colTop);

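            // The loss layer wraps an internal SoftmaxLayer: it shares this
            // layer's first bottom blob as its input and writes the resulting
            // class probabilities into m_blobProb for the loss kernels below.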
            LayerParameter param_softmax = m_param.Clone(false);
            param_softmax.SetType(LayerParameter.LayerType.SOFTMAX);
            param_softmax.loss_weight.Clear();

            m_softmaxLayer = new SoftmaxLayer<T>(m_cuda, m_log, param_softmax);
            m_colSoftmaxBottom = new BlobCollection<T>();
            m_colSoftmaxTop = new BlobCollection<T>();

            m_colSoftmaxBottom.Add(colBottom[0]);
            m_colSoftmaxTop.Add(m_blobProb);
            m_softmaxLayer.Setup(m_colSoftmaxBottom, m_colSoftmaxTop);

            m_nIgnoreLabel = m_param.loss_param.ignore_label;
        }

        public override void Reshape(BlobCollection<T> colBottom, BlobCollection<T> colTop)
        {
            base.Reshape(colBottom, colTop);

            m_softmaxLayer.Reshape(m_colSoftmaxBottom, m_colSoftmaxTop);
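            // With canonical softmax axis k and input shape (d0, ..., dn), the
            // outer num is d0*...*d(k-1) (e.g. the batch size) and the inner
            // num is d(k+1)*...*dn (e.g. H*W), giving outer*inner predicted
            // distributions, each over the d(k) classes.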
            m_nSoftmaxAxis = colBottom[0].CanonicalAxisIndex(m_param.softmax_param.axis);
            m_nOuterNum = colBottom[0].count(0, m_nSoftmaxAxis);
            m_nInnerNum = colBottom[0].count(m_nSoftmaxAxis + 1);

            if (!m_bIgnoreLabels)
            {
                m_log.CHECK_EQ(m_nOuterNum * m_nInnerNum, colBottom[1].count(), "Number of labels must match number of predictions; e.g., if softmax axis == 1 and prediction shape is (N, C, H, W), label count (number of labels) must be N*H*W, with integer values in {0, 1, ..., C-1}.");

                if (colTop.Count >= 2)
                {
                    // softmax output
                    colTop[1].ReshapeLike(colBottom[0]);
                }
            }
        }

        protected override void forward(BlobCollection<T> colBottom, BlobCollection<T> colTop)
        {
            m_softmaxLayer.Forward(m_colSoftmaxBottom, m_colSoftmaxTop);

            long hProbData = m_blobProb.gpu_data;
            long hLabel = colBottom[1].gpu_data;
            int nDim = m_blobProb.count() / m_nOuterNum;
            int nCount = m_nOuterNum * m_nInnerNum;

            // Since this memory is not otherwise used here, we use it to avoid
            // having to allocate new GPU memory to accumulate intermediate results.
            long hLossData = colBottom[0].mutable_gpu_diff;

            // Similarly, this memory is never used elsewhere, and thus we can use it
            // to avoid having to allocate additional GPU memory.
            long hCounts = m_blobProb.mutable_gpu_diff;

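            // For each of the outer*inner positions, the forward kernel writes
            // -log(prob[label]) into hLossData, and a 1 into hCounts (0 when
            // the label equals the ignore label) so the number of positions
            // that actually contribute to the loss can be summed below.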
            m_cuda.softmaxloss_fwd(nCount, hProbData, hLabel, hLossData, m_nOuterNum, nDim, m_nInnerNum, hCounts, m_nIgnoreLabel);
            T fLoss = m_cuda.asum(nCount, hLossData);
            double dfValidCount = -1;

            // Only launch another cuda kernel if we actually need the count of valid
            // outputs.
            if (m_normalization == LossParameter.NormalizationMode.VALID && m_nIgnoreLabel.HasValue)
                dfValidCount = convertD(m_cuda.asum(nCount, hCounts));

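            // When no ignore label is set, dfValidCount remains -1 and
            // get_normalizer falls back to the full outer*inner count for
            // VALID normalization.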
            double dfLoss = convertD(fLoss);
            double dfNormalizer = get_normalizer(m_normalization, (int)dfValidCount);
            double dfFinalLoss = dfLoss / dfNormalizer;

            colTop[0].SetData(dfFinalLoss, 0);

            if (colTop.Count == 2)
                colTop[1].ShareData(m_blobProb);

            // Clear the scratch memory to prevent it from interfering with the backward pass (see #602).
            colBottom[0].SetDiff(0);
        }

        protected override void backward(BlobCollection<T> colTop, List<bool> rgbPropagateDown, BlobCollection<T> colBottom)
        {
            if (!rgbPropagateDown[0])
                return;

            long hBottomDiff = colBottom[0].mutable_gpu_diff;
            long hProbData = m_blobProb.gpu_data;
            long hTopData = colTop[0].gpu_data;

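            // The gradient of softmax + multinomial logistic loss w.r.t. the
            // predictions is (prob - 1{label}). The copy below seeds the bottom
            // diff with the probabilities; the backward kernel then subtracts
            // 1 at each true class and zeroes ignored positions.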
            m_cuda.copy(m_blobProb.count(), hProbData, hBottomDiff);

            long hLabel = colBottom[1].gpu_data;
            int nDim = m_blobProb.count() / m_nOuterNum;
            int nCount = m_nOuterNum * m_nInnerNum;

            // Since this memory is not used for anything else,
            // we use it to avoid allocating new GPU memory.
            long hCounts = m_blobProb.mutable_gpu_diff;

            m_cuda.softmaxloss_bwd(nCount, hTopData, hLabel, hBottomDiff, m_nOuterNum, nDim, m_nInnerNum, hCounts, m_nIgnoreLabel);

            double dfValidCount = -1;

            // Only launch another cuda kernel if we actually need the count of valid
            // outputs.
            if (m_normalization == LossParameter.NormalizationMode.VALID && m_nIgnoreLabel.HasValue)
                dfValidCount = convertD(m_cuda.asum(nCount, hCounts));

            double dfTopDiff = convertD(colTop[0].GetDiff(0));
            double dfNormalizer = get_normalizer(m_normalization, (int)dfValidCount);
            double dfLossWeight = dfTopDiff / dfNormalizer;

            m_cuda.scal(m_blobProb.count(), convert(dfLossWeight), hBottomDiff);
        }
    }
}
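A minimal usage sketch follows (not part of the source above): it wires a SoftmaxLossLayer by hand for a 16-sample, 10-class batch. The exact CudaDnn, Log, LayerParameter, and Blob constructor arguments shown are assumptions for illustration; in practice the layer is normally created and connected by the Net from a model description.

using MyCaffe.basecode;
using MyCaffe.common;
using MyCaffe.param;
using MyCaffe.layers;

public static class SoftmaxLossExample
{
    public static void Run()
    {
        // Assumed constructor arguments, for illustration only.
        CudaDnn<float> cuda = new CudaDnn<float>(0);    // GPU device 0.
        Log log = new Log("softmaxloss_example");
        LayerParameter p = new LayerParameter(LayerParameter.LayerType.SOFTMAXWITH_LOSS);

        SoftmaxLossLayer<float> layer = new SoftmaxLossLayer<float>(cuda, log, p);

        // Bottom blobs: (N, C, H, W) predictions and one label per N*H*W position.
        Blob<float> blobPred = new Blob<float>(cuda, log, 16, 10, 1, 1);
        Blob<float> blobLabel = new Blob<float>(cuda, log, 16, 1, 1, 1);
        Blob<float> blobLoss = new Blob<float>(cuda, log);

        BlobCollection<float> colBottom = new BlobCollection<float>();
        colBottom.Add(blobPred);
        colBottom.Add(blobLabel);

        BlobCollection<float> colTop = new BlobCollection<float>();
        colTop.Add(blobLoss);

        layer.Setup(colBottom, colTop);
        layer.Forward(colBottom, colTop);   // blobLoss now holds the normalized scalar loss.

        layer.Dispose();
    }
}

Adding a second blob to colTop before Setup would, per MaxTopBlobs and the forward code above, also expose the softmax probabilities as a second output sharing m_blobProb's data.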
The Log class provides general output in text form.
Definition: Log.cs:13
void CHECK_EQ(double df1, double df2, string str)
Test whether one number is equal to another.
Definition: Log.cs:239
The BlobCollection contains a list of Blobs.
void Add(Blob< T > b)
Add a new Blob to the collection.
void SetData(double df)
Set all blob data to the value specified.
void SetDiff(double df)
Set all blob diff to the value specified.
int Count
Returns the number of items in the collection.
void ReshapeLike(BlobCollection< T > src)
Reshapes all blobs in the collection to the sizes of the source.
The Blob is the main holder of data that moves through the Layers of the Net.
Definition: Blob.cs:25
long mutable_gpu_diff
Returns the diff GPU handle used by the CudaDnn connection.
Definition: Blob.cs:1555
int count()
Returns the total number of items in the Blob.
Definition: Blob.cs:739
string Name
Get/set the name of the Blob.
Definition: Blob.cs:2184
virtual void Dispose(bool bDisposing)
Releases all resources used by the Blob (including both GPU and Host).
Definition: Blob.cs:402
long gpu_data
Returns the data GPU handle used by the CudaDnn connection.
Definition: Blob.cs:1479
The CudaDnn object is the main interface to the Low-Level Cuda C++ DLL.
Definition: CudaDnn.cs:969
An interface for the units of computation which can be composed into a Net.
Definition: Layer.cs:31
Log m_log
Specifies the Log for output.
Definition: Layer.cs:43
LayerParameter m_param
Specifies the LayerParameter describing the Layer.
Definition: Layer.cs:47
void convert(BlobCollection< T > col)
Convert a collection of blobs from / to half size.
Definition: Layer.cs:535
double convertD(T df)
Converts a generic to a double value.
Definition: Layer.cs:1349
CudaDnn< T > m_cuda
Specifies the CudaDnn connection to Cuda.
Definition: Layer.cs:39
LayerParameter.LayerType m_type
Specifies the Layer type.
Definition: Layer.cs:35
The LossLayer provides an interface for Layers that take two blobs as input – usually (1) prediction...
Definition: LossLayer.cs:23
bool m_bIgnoreLabels
Set to true when labels are to be ignored.
Definition: LossLayer.cs:31
int m_nOuterNum
Specifies the outer num, such as the batch count (e.g. count(0, axis)). Each derivative class must se...
Definition: LossLayer.cs:39
int m_nInnerNum
Specifies the inner num, such as the channel + height + width (e.g. count(axis + 1))....
Definition: LossLayer.cs:43
virtual double get_normalizer(LossParameter.NormalizationMode normalization_mode, int nValidCount)
Returns the normalizer used to normalize the loss.
Definition: LossLayer.cs:92
LossParameter.NormalizationMode m_normalization
Specifies the normalization mode used to normalize the loss.
Definition: LossLayer.cs:35
The SoftmaxLayer computes the softmax function. This layer is initialized with the MyCaffe....
Definition: SoftmaxLayer.cs:24
Computes the multinomial logistic loss for a one-of-many classification task, passing real-valued pre...
override void setup_internal_blobs(BlobCollection< T > col)
Derivative layers should add all internal blobs to the 'col' provided.
SoftmaxLossLayer(CudaDnn< T > cuda, Log log, LayerParameter p)
Constructor.
override void dispose()
Releases all GPU and host resources used by the Layer.
override void LayerSetUp(BlobCollection< T > colBottom, BlobCollection< T > colTop)
Setup the layer.
override void backward(BlobCollection< T > colTop, List< bool > rgbPropagateDown, BlobCollection< T > colBottom)
Computes the softmax loss error gradient w.r.t. the predictions.
override int MaxTopBlobs
Returns the maximum number of required top (output) Blobs: loss, softmax output
override int MinTopBlobs
Returns the minimum number of required top (output) Blobs: loss.
override int ExactNumTopBlobs
Returns the exact number of required top (output) Blobs: -1, indicating a variable number.
override void Reshape(BlobCollection< T > colBottom, BlobCollection< T > colTop)
Reshape the bottom (input) and top (output) blobs.
override void forward(BlobCollection< T > colBottom, BlobCollection< T > colTop)
The forward computation.
Specifies the base parameter for all layers.
string name
Specifies the name of this LayerParameter.
List< double > loss_weight
Specifies the loss weight.
SoftmaxParameter softmax_param
Returns the parameter set when initialized with LayerType.SOFTMAX
void SetType(LayerType type, bool bNewParam=true)
Set the layer type.
LayerType
Specifies the layer type.
LossParameter loss_param
Returns the parameter set when initialized with LayerType.LOSS
virtual LayerParameter Clone(bool bCloneBlobs)
Creates a new copy of this instance of the parameter.
Stores the parameters used by loss layers.
NormalizationMode
How to normalize the loss for loss layers that aggregate across batches, spatial dimensions,...
int? ignore_label
If specified, the ignore instances with the given label.
Specifies the parameters for the SoftmaxLayer
override LayerParameterBase Clone()
Creates a new copy of this instance of the parameter.
int axis
The axis along which to perform the softmax – may be negative to index from the end (e....
The MyCaffe.basecode contains all generic types used throughout MyCaffe.
Definition: Annotation.cs:12
The MyCaffe.common namespace contains common MyCaffe classes.
Definition: BatchInput.cs:8
The MyCaffe.layers namespace contains all layers that have a solidified code base,...
Definition: LayerFactory.cs:15
The MyCaffe.param namespace contains parameters used to create models.
The MyCaffe namespace contains the main body of MyCaffe code that closely tracks the C++ Caffe open-...
Definition: Annotation.cs:12