MyCaffe  1.12.2.41
Deep learning software for Windows C# programmers.
QuantileLossLayer.cs
using System;
using System.Collections.Generic;
using System.Diagnostics;
using System.IO;
using System.Linq;
using System.Text;
using MyCaffe.basecode;
using MyCaffe.common;
using MyCaffe.param;

namespace MyCaffe.layers
{
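    /// <summary>
    /// The QuantileLossLayer computes the quantile loss for real-valued regression tasks.
    /// </summary>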
    public class QuantileLossLayer<T> : LossLayer<T>
    {
        List<int> m_rgShape = new List<int>(4);
        int m_nCount;
        int m_nChannels;
        Blob<T> m_blobTargetsFull;
        Blob<T> m_blobErrors;
        Blob<T> m_blobQuantile1;
        Blob<T> m_blobQuantile2;
        Blob<T> m_blobDesiredQuantiles;
        Blob<T> m_blobLoss;
        Blob<T> m_blobLossSum;
        Blob<T> m_blobLossSumMean;
        Blob<T> m_blobWork;

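        /// <summary>
        /// The QuantileLossLayer constructor.
        /// </summary>
        /// <param name="cuda">Specifies the CudaDnn connection to Cuda.</param>
        /// <param name="log">Specifies the Log for output.</param>
        /// <param name="p">Specifies the LayerParameter describing the Layer.</param>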
        public QuantileLossLayer(CudaDnn<T> cuda, Log log, LayerParameter p)
            : base(cuda, log, p)
        {
            m_type = LayerParameter.LayerType.QUANTILE_LOSS;

            m_blobErrors = new Blob<T>(cuda, log);
            m_blobErrors.Name = m_param.name + ".diff";
            m_blobTargetsFull = new Blob<T>(cuda, log);
            m_blobTargetsFull.Name = m_param.name + ".trgtfull";
            m_blobQuantile1 = new Blob<T>(cuda, log);
            m_blobQuantile1.Name = m_param.name + ".qtl1";
            m_blobQuantile2 = new Blob<T>(cuda, log);
            m_blobQuantile2.Name = m_param.name + ".qtl2";
            m_blobDesiredQuantiles = new Blob<T>(cuda, log);
            m_blobDesiredQuantiles.Name = m_param.name + ".desqtl";
            m_blobLoss = new Blob<T>(cuda, log);
            m_blobLoss.Name = m_param.name + ".loss";
            m_blobLossSum = new Blob<T>(cuda, log);
            m_blobLossSum.Name = m_param.name + ".losssum";
            m_blobLossSumMean = new Blob<T>(cuda, log);
            m_blobLossSumMean.Name = m_param.name + ".losssum.mean";
            m_blobWork = new Blob<T>(m_cuda, m_log);
            m_blobWork.Name = m_param.name + ".work";
        }

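        /// <summary>
        /// Releases all GPU and host resources used by the Layer.
        /// </summary>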
        protected override void dispose()
        {
            dispose(ref m_blobErrors);
            dispose(ref m_blobQuantile1);
            dispose(ref m_blobQuantile2);
            dispose(ref m_blobTargetsFull);
            dispose(ref m_blobDesiredQuantiles);
            dispose(ref m_blobLoss);
            dispose(ref m_blobLossSum);
            dispose(ref m_blobLossSumMean);
            dispose(ref m_blobWork);

            base.dispose();
        }

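        /// <summary>
        /// Returns the exact number of required top (output) Blobs as variable.
        /// </summary>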
        public override int ExactNumTopBlobs
        {
            get { return -1; }
        }

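        /// <summary>
        /// Returns the minimum number of required top (output) Blobs: loss.
        /// </summary>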
        public override int MinTopBlobs
        {
            get { return 1; }
        }

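        /// <summary>
        /// Returns the maximum number of required top (output) Blobs: loss, q_risk.
        /// </summary>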
        public override int MaxTopBlobs
        {
            get { return 2; }
        }

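        /// <summary>
        /// Unlike most loss layers, in the QuantileLossLayer we can backpropagate to both inputs, so override to return true.
        /// </summary>
        /// <param name="nBottomIdx">Specifies the index of the bottom Blob.</param>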
        public override bool AllowForceBackward(int nBottomIdx)
        {
            return true;
        }

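        /// <summary>
        /// Setup the layer.
        /// </summary>
        /// <param name="colBottom">Specifies the collection of bottom (input) Blobs.</param>
        /// <param name="colTop">Specifies the collection of top (output) Blobs.</param>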
        public override void LayerSetUp(BlobCollection<T> colBottom, BlobCollection<T> colTop)
        {
            base.LayerSetUp(colBottom, colTop);

            List<int> rgShape = new List<int>(1);
            rgShape.Add(m_param.quantile_loss_param.desired_quantiles.Count);
            m_blobDesiredQuantiles.Reshape(rgShape);

            float[] rgDeqQtl1 = new float[m_param.quantile_loss_param.desired_quantiles.Count];
            float[] rgDeqQtl2 = new float[m_param.quantile_loss_param.desired_quantiles.Count];

            // Store the 'q' factors in the data and the '(q - 1)' factors in the diff
            // for later use when computing the loss max(q * e, (q - 1) * e).
            for (int i = 0; i < rgDeqQtl1.Length; i++)
            {
                rgDeqQtl1[i] = m_param.quantile_loss_param.desired_quantiles[i];
                rgDeqQtl2[i] = rgDeqQtl1[i] - 1;
            }

            m_blobDesiredQuantiles.mutable_cpu_data = convert(rgDeqQtl1);
            m_blobDesiredQuantiles.mutable_cpu_diff = convert(rgDeqQtl2);
        }

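        /// <summary>
        /// Reshape the bottom (input) and top (output) blobs.
        /// </summary>
        /// <param name="colBottom">Specifies the collection of bottom (input) Blobs.</param>
        /// <param name="colTop">Specifies the collection of top (output) Blobs.</param>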
        public override void Reshape(BlobCollection<T> colBottom, BlobCollection<T> colTop)
        {
            base.Reshape(colBottom, colTop);

            int nAxes = colBottom[0].num_axes;
            m_nCount = colBottom[0].count();
            m_nOuterNum = colBottom[0].num;
            m_nChannels = (nAxes == 2) ? 1 : colBottom[0].channels;
            m_nInnerNum = (nAxes == 2) ? colBottom[0].channels : colBottom[0].count(2);

            m_log.CHECK_EQ(colBottom[0].num, colBottom[1].num, "Input and target must have the same 'num' size.");
            m_log.CHECK_EQ(colBottom[0].channels, colBottom[1].channels, "Input and target must have the same 'channel' size.");
            m_log.CHECK_EQ(colBottom[0].height, colBottom[1].height * m_param.quantile_loss_param.desired_quantiles.Count, "The input 'height' must equal the target 'height' times 'desired_quantiles.Count'.");

            m_blobErrors.ReshapeLike(colBottom[0]);
            m_blobTargetsFull.ReshapeLike(colBottom[0]);
            m_blobQuantile1.ReshapeLike(colBottom[0]);
            m_blobQuantile2.ReshapeLike(colBottom[0]);
            m_blobLoss.ReshapeLike(colBottom[0]);
            m_blobWork.ReshapeLike(colBottom[0]);

            m_rgShape.Clear();
            m_rgShape.Add(m_nOuterNum);
            m_rgShape.Add(m_nChannels);
            m_blobLossSum.Reshape(m_rgShape);

            m_rgShape.Clear();
            m_rgShape.Add(m_nOuterNum);
            m_blobLossSumMean.Reshape(m_rgShape);

            m_rgShape.Clear();
            m_rgShape.Add(1);
            colTop[0].Reshape(m_rgShape);

            if (colTop.Count > 1)
            {
                m_rgShape[0] = m_nChannels;
                colTop[1].Reshape(m_rgShape);
            }
        }

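        /// <summary>
        /// Forward computation.
        /// </summary>
        /// <param name="colBottom">Specifies the collection of bottom (input) Blobs: the predicted quantiles and the observed targets.</param>
        /// <param name="colTop">Specifies the collection of top (output) Blobs: the loss, and optionally the q-risk per quantile.</param>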
        protected override void forward(BlobCollection<T> colBottom, BlobCollection<T> colTop)
        {
            // Fill the targets across all output quantiles.
            m_cuda.channel_fillfrom(m_nCount, m_nOuterNum, m_nChannels, m_nInnerNum, colBottom[1].gpu_data, m_blobTargetsFull.mutable_gpu_data, DIR.FWD);

            // Compute the actual error between the observed target and each predicted quantile.
            m_cuda.sub(m_nCount, m_blobTargetsFull.gpu_data, colBottom[0].gpu_data, m_blobErrors.mutable_gpu_data);

            // Compute the loss separately for each sample, time-step and quantile:
            // loss = max(q * e, (q - 1) * e), where e = target - prediction.
            m_cuda.channel_copyall(m_nCount, m_nOuterNum * m_nChannels, 1, m_nInnerNum, m_blobDesiredQuantiles.gpu_diff, m_blobWork.mutable_gpu_data);
            m_cuda.mul(m_nCount, m_blobWork.gpu_data, m_blobErrors.gpu_data, m_blobQuantile1.mutable_gpu_data);

            m_cuda.channel_copyall(m_nCount, m_nOuterNum * m_nChannels, 1, m_nInnerNum, m_blobDesiredQuantiles.gpu_data, m_blobWork.mutable_gpu_data);
            m_cuda.mul(m_nCount, m_blobWork.gpu_data, m_blobErrors.gpu_data, m_blobQuantile2.mutable_gpu_data);

            m_cuda.max(m_nCount, m_blobQuantile2.gpu_data, m_blobQuantile1.gpu_data, m_blobLoss.mutable_gpu_data);

            // Sum the losses over the quantiles.
            m_cuda.channel_sum(m_nCount, m_nOuterNum, m_nChannels, m_nInnerNum, m_blobLoss.gpu_data, m_blobLossSum.mutable_gpu_data, false);

            // Take the mean of the summed losses over time.
            m_cuda.channel_mean(m_blobLossSum.count(), m_nOuterNum, 1, m_nChannels, m_blobLossSum.gpu_data, m_blobLossSumMean.mutable_gpu_data);

            // Average across time and observations.
            double dfQLoss = m_blobLossSumMean.mean();
            colTop[0].SetData(dfQLoss, 0);

            // Calculate the q-risk for each quantile.
            if (colTop.Count > 1)
            {
                double dfTargetSum = convertD(colBottom[1].asum_data());
                m_cuda.channel_sum(m_blobLossSum.count(), 1, m_nOuterNum, m_nChannels, m_blobLossSum.gpu_data, colTop[1].mutable_gpu_data, true);

                colTop[1].scale_data(2.0 / dfTargetSum);
            }

            callLossEvent(m_blobLossSumMean);
        }

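        /// <summary>
        /// Computes the QuantileLoss error gradient w.r.t. the inputs.
        /// </summary>
        /// <param name="colTop">Specifies the collection of top (output) Blobs.</param>
        /// <param name="rgbPropagateDown">Specifies whether or not to propagate down to each bottom Blob.</param>
        /// <param name="colBottom">Specifies the collection of bottom (input) Blobs.</param>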
        protected override void backward(BlobCollection<T> colTop, List<bool> rgbPropagateDown, BlobCollection<T> colBottom)
        {
            if (!rgbPropagateDown[0])
                return;

            // Sum and average over quantiles, time and observations.
            double dfGrad = convertD(colTop[0].GetDiff(0));
            m_blobLoss.SetDiff(dfGrad / (m_nOuterNum * m_nChannels));

            // Compute the gradient separately for each sample, time-step and quantile.
            m_cuda.max_bwd(m_nCount, m_blobQuantile2.gpu_data, m_blobQuantile1.gpu_data, m_blobLoss.gpu_diff, m_blobQuantile2.mutable_gpu_diff, m_blobQuantile1.mutable_gpu_diff);

            m_cuda.channel_copyall(m_nCount, m_nOuterNum * m_nChannels, 1, m_nInnerNum, m_blobDesiredQuantiles.gpu_data, m_blobWork.mutable_gpu_data);
            m_cuda.mul(m_nCount, m_blobWork.gpu_data, m_blobQuantile2.gpu_diff, m_blobQuantile2.mutable_gpu_diff);

            m_cuda.channel_copyall(m_nCount, m_nOuterNum * m_nChannels, 1, m_nInnerNum, m_blobDesiredQuantiles.gpu_diff, m_blobWork.mutable_gpu_data);
            m_cuda.mul(m_nCount, m_blobWork.gpu_data, m_blobQuantile1.gpu_diff, m_blobQuantile1.mutable_gpu_diff);

            m_cuda.add(m_nCount, m_blobQuantile1.gpu_diff, m_blobQuantile2.gpu_diff, m_blobErrors.mutable_gpu_diff);

            // The errors were computed as target - prediction, so negate to obtain the
            // gradient with respect to the predictions.
            m_cuda.scale(m_nCount, -1.0, m_blobErrors.gpu_diff, colBottom[0].mutable_gpu_diff);
        }
    }
}
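For reference, the loss computed in forward above is the standard quantile (pinball) loss: for error e = target - prediction and desired quantile q, loss = max(q * e, (q - 1) * e), summed over the quantiles and averaged over time steps and observations; the optional second top blob reports the q-risk, 2 * sum(loss) / sum(|target|), per quantile. The following is an illustrative CPU sketch of that reduction, not part of the layer; the names are hypothetical, and the time and batch axes are collapsed into a single sample axis.

using System;

public static class QuantileLossSketch
{
    // Pinball loss for a single prediction/target pair at quantile q:
    // e = target - prediction; loss = max(q * e, (q - 1) * e).
    public static double PinballLoss(double dfPred, double dfTarget, double dfQuantile)
    {
        double dfErr = dfTarget - dfPred;
        return Math.Max(dfQuantile * dfErr, (dfQuantile - 1.0) * dfErr);
    }

    // Sum over quantiles, then average over samples, mirroring the
    // channel_sum / channel_mean reduction used in forward above.
    public static double AverageLoss(double[][] rgPred, double[] rgTarget, double[] rgQuantiles)
    {
        double dfTotal = 0;

        for (int i = 0; i < rgTarget.Length; i++)
        {
            for (int q = 0; q < rgQuantiles.Length; q++)
                dfTotal += PinballLoss(rgPred[i][q], rgTarget[i], rgQuantiles[q]);
        }

        return dfTotal / rgTarget.Length;
    }
}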
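A minimal configuration sketch, assuming the LayerParameter constructor that takes a LayerType and that desired_quantiles is a standard List<float>; the 0.1/0.5/0.9 values are illustrative.

// Hypothetical example values; only 'name' and
// 'quantile_loss_param.desired_quantiles' are read by the layer code above.
LayerParameter p = new LayerParameter(LayerParameter.LayerType.QUANTILE_LOSS);
p.name = "qloss";
p.quantile_loss_param.desired_quantiles.Add(0.1f); // P10
p.quantile_loss_param.desired_quantiles.Add(0.5f); // P50 (median)
p.quantile_loss_param.desired_quantiles.Add(0.9f); // P90

With three desired quantiles, the prediction bottom must have a 'height' equal to three times the target 'height', as enforced by the CHECK_EQ calls in Reshape.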