MyCaffe  1.12.2.41
Deep learning software for Windows C# programmers.
TripletLossLayer.cs
using System;
using System.Collections.Generic;
using System.Linq;
using System.Text;
using MyCaffe.basecode;
using MyCaffe.common;
using MyCaffe.param;

namespace MyCaffe.layers.beta
{
    /// <summary>
    /// TripletLoss Layer - computes the triplet loss and its gradients.
    /// </summary>
    public class TripletLossLayer<T> : LossLayer<T>
    {
        Blob<T> m_blobDiffAP;
        Blob<T> m_blobDiffSqAP;
        Blob<T> m_blobDistSqAP;
        Blob<T> m_blobDiffAN;
        Blob<T> m_blobDiffSqAN;
        Blob<T> m_blobDistSqAN;
        Blob<T> m_blobDiffPN;
        Blob<T> m_blobSumVec;
        Blob<T> m_blobLossVec;
        Blob<T> m_blobWork;
        Blob<T> m_blobPreGenTargetsPos;
        Blob<T> m_blobPreGenTargetsNeg;
        double m_dfAlpha;

        /// <summary>
        /// The TripletLossLayer constructor.
        /// </summary>
        /// <param name="cuda">Specifies the CudaDnn connection to Cuda.</param>
        /// <param name="log">Specifies the Log for output.</param>
        /// <param name="p">Specifies the LayerParameter describing the Layer.</param>
        public TripletLossLayer(CudaDnn<T> cuda, Log log, LayerParameter p)
            : base(cuda, log, p)
        {
            m_type = LayerParameter.LayerType.TRIPLET_LOSS;

            m_blobDiffAP = new Blob<T>(m_cuda, m_log);
            m_blobDiffAP.Name = m_param.name + ".positive delta";

            m_blobDiffSqAP = new Blob<T>(m_cuda, m_log, false);
            m_blobDiffSqAP.Name = m_param.name + ".positive delta sq";

            m_blobDistSqAP = new Blob<T>(m_cuda, m_log, false);
            m_blobDistSqAP.Name = m_param.name + ".positive dist sq";

            m_blobDiffAN = new Blob<T>(m_cuda, m_log);
            m_blobDiffAN.Name = m_param.name + ".negative delta";

            m_blobDiffSqAN = new Blob<T>(m_cuda, m_log, false);
            m_blobDiffSqAN.Name = m_param.name + ".negative delta sq";

            m_blobDistSqAN = new Blob<T>(m_cuda, m_log, false);
            m_blobDistSqAN.Name = m_param.name + ".negative dist sq";

            m_blobDiffPN = new Blob<T>(m_cuda, m_log);
            m_blobDiffPN.Name = m_param.name + ".pos/neg delta";

            m_blobSumVec = new Blob<T>(m_cuda, m_log, false);
            m_blobSumVec.Name = m_param.name + ".summer vec";

            m_blobLossVec = new Blob<T>(m_cuda, m_log, false);
            m_blobLossVec.Name = m_param.name + ".loss vec";

            m_blobWork = new Blob<T>(m_cuda, m_log);
            m_blobWork.Name = m_param.name + ".work";
        }

        /// <summary>
        /// Releases all GPU and host resources used by the Layer.
        /// </summary>
        protected override void dispose()
        {
            if (m_blobDiffAP != null)
            {
                m_blobDiffAP.Dispose();
                m_blobDiffAP = null;
            }

            if (m_blobDiffSqAP != null)
            {
                m_blobDiffSqAP.Dispose();
                m_blobDiffSqAP = null;
            }

            if (m_blobDistSqAP != null)
            {
                m_blobDistSqAP.Dispose();
                m_blobDistSqAP = null;
            }

            if (m_blobDiffAN != null)
            {
                m_blobDiffAN.Dispose();
                m_blobDiffAN = null;
            }

            if (m_blobDiffSqAN != null)
            {
                m_blobDiffSqAN.Dispose();
                m_blobDiffSqAN = null;
            }

            if (m_blobDistSqAN != null)
            {
                m_blobDistSqAN.Dispose();
                m_blobDistSqAN = null;
            }

            if (m_blobDiffPN != null)
            {
                m_blobDiffPN.Dispose();
                m_blobDiffPN = null;
            }

            if (m_blobSumVec != null)
            {
                m_blobSumVec.Dispose();
                m_blobSumVec = null;
            }

            if (m_blobLossVec != null)
            {
                m_blobLossVec.Dispose();
                m_blobLossVec = null;
            }

            if (m_blobWork != null)
            {
                m_blobWork.Dispose();
                m_blobWork = null;
            }

            if (m_blobPreGenTargetsPos != null)
            {
                m_blobPreGenTargetsPos.Dispose();
                m_blobPreGenTargetsPos = null;
            }

            if (m_blobPreGenTargetsNeg != null)
            {
                m_blobPreGenTargetsNeg.Dispose();
                m_blobPreGenTargetsNeg = null;
            }

            base.dispose();
        }

        /// <summary>
        /// Derived layers add all internal blobs to the 'col' provided.
        /// </summary>
        protected override void setup_internal_blobs(BlobCollection<T> col)
        {
            if (col.Count > 0)
                return;

            col.Add(m_blobDiffAP);
            col.Add(m_blobDiffSqAP);
            col.Add(m_blobDistSqAP);
            col.Add(m_blobDiffAN);
            col.Add(m_blobDiffSqAN);
            col.Add(m_blobDistSqAN);
            col.Add(m_blobDiffPN);
            col.Add(m_blobSumVec);
            col.Add(m_blobLossVec);
            col.Add(m_blobWork);

            if (m_blobPreGenTargetsPos != null)
                col.Add(m_blobPreGenTargetsPos);

            if (m_blobPreGenTargetsNeg != null)
                col.Add(m_blobPreGenTargetsNeg);
        }

        /// <summary>
        /// Returns the exact number of bottom blobs; these are variable, so -1 is returned.
        /// </summary>
        public override int ExactNumBottomBlobs
        {
            get { return -1; }
        }

        /// <summary>
        /// Returns the minimum number of bottom blobs: anchor, positive, negative, label.
        /// </summary>
        public override int MinBottomBlobs
        {
            get { return 4; } // anchor, positive, negative, label
        }

        /// <summary>
        /// Returns the maximum number of bottom blobs: anchor, positive, negative, label, centroids (from the decode layer).
        /// </summary>
        public override int MaxBottomBlobs
        {
            get { return 5; } // anchor, positive, negative, label, centroids (from decode layer)
        }

        /// <summary>
        /// Returns the exact number of required top (output) Blobs: loss.
        /// </summary>
        public override int ExactNumTopBlobs
        {
            get { return 1; }
        }

        /// <summary>
        /// Returns true for all but the labels, since we want the loss value to be propagated back to the data inputs.
        /// </summary>
        public override bool AllowForceBackward(int nBottomIdx)
        {
            if (nBottomIdx <= 2)
                return true;

            return false;
        }

        /// <summary>
        /// Setup the layer.
        /// </summary>
        public override void LayerSetUp(BlobCollection<T> colBottom, BlobCollection<T> colTop)
        {
            base.LayerSetUp(colBottom, colTop);
            m_dfAlpha = m_param.triplet_loss_param.alpha;

            // If the fifth bottom exists (the centroids), initialize the pregen targets.
            if (colBottom.Count == 5)
            {
                m_blobPreGenTargetsNeg = new Blob<T>(m_cuda, m_log, false);
                m_blobPreGenTargetsNeg.Name = "pregen neg";
                m_blobPreGenTargetsPos = new Blob<T>(m_cuda, m_log);
                m_blobPreGenTargetsPos.Name = "pregen pos";
            }
        }

        /// <summary>
        /// Reshape the bottom (input) and top (output) blobs.
        /// </summary>
        public override void Reshape(BlobCollection<T> colBottom, BlobCollection<T> colTop)
        {
            base.Reshape(colBottom, colTop);

            m_log.CHECK(Utility.Compare<int>(colBottom[0].shape(), colBottom[1].shape()), "Inputs must have the same dimension.");
            m_log.CHECK(Utility.Compare<int>(colBottom[0].shape(), colBottom[2].shape()), "Inputs must have the same dimension.");

            m_blobDiffAP.ReshapeLike(colBottom[0]);
            m_blobDiffSqAP.ReshapeLike(colBottom[0]);
            m_blobDiffAN.ReshapeLike(colBottom[0]);
            m_blobDiffSqAN.ReshapeLike(colBottom[0]);
            m_blobDiffPN.ReshapeLike(colBottom[0]);
            m_blobLossVec.ReshapeLike(colBottom[0]);

            int nNum = colBottom[0].num;
            int nDim = colBottom[0].count(1);

            // The sum vector is filled with ones so that a gemv product against the
            // squared differences yields per-sample row sums (the squared distances).
            m_blobSumVec.Reshape(nDim, 1, 1, 1);
            m_blobSumVec.SetData(1.0);

            m_blobWork.Reshape(nNum, 1, 1, 1);
            m_blobWork.SetData(0.0);

            m_blobDistSqAP.ReshapeLike(m_blobWork);
            m_blobDistSqAN.ReshapeLike(m_blobWork);

            List<int> rgLossShape = new List<int>(); // Loss layers output a scalar; 0 axes.
            colTop[0].Reshape(rgLossShape);

            if (m_blobPreGenTargetsNeg != null)
                m_blobPreGenTargetsNeg.ReshapeLike(colBottom[0]);

            if (m_blobPreGenTargetsPos != null)
                m_blobPreGenTargetsPos.ReshapeLike(colBottom[0]);
        }

        /// <summary>
        /// Loads the pre-gen targets; only made public for testing.
        /// </summary>
        public void loadPreGenTargets(Blob<T> lbl, Blob<T> tgt, Blob<T> tgtNeg, Blob<T> tgtPos)
        {
            float[] rgLabels = convertF(lbl.update_cpu_data());
            int nLblDim = lbl.count(1);
            int nLblNum = tgt.num;
            int nNum = lbl.num;
            int nDim = tgt.count(1);
            Random rand = new Random();
            List<int> rgLabelVals = new List<int>();
            Dictionary<int, List<int>> rgrgLabelSel = new Dictionary<int, List<int>>();

            for (int i = 0; i < tgt.num; i++)
            {
                rgLabelVals.Add(i + m_param.triplet_loss_param.pregen_label_start);
                rgrgLabelSel.Add(i + m_param.triplet_loss_param.pregen_label_start, new List<int>());
            }

            m_log.CHECK_EQ(nNum, tgtNeg.num, "The neg targets have an incorrect num!");
            m_log.CHECK_EQ(nNum, tgtPos.num, "The pos targets have an incorrect num!");
            m_log.CHECK_EQ(nDim, tgtNeg.count(1), "The neg targets have an incorrect dim!");
            m_log.CHECK_EQ(nDim, tgtPos.count(1), "The pos targets have an incorrect dim!");

            for (int i = 0; i < nNum; i++)
            {
                int nLabel = (int)rgLabels[i * nLblDim];

                // Copy the positive to match the anchor label.
                m_cuda.copy(nDim, tgt.gpu_data, tgtPos.mutable_gpu_data, nLabel * nDim, i * nDim);

                // Copy the negative to NOT match the anchor label; the candidate list is
                // refilled once every non-matching label has been used, so negatives are
                // drawn without replacement.
                if (rgrgLabelSel[nLabel].Count == 0)
                {
                    for (int l = 0; l < rgLabelVals.Count; l++)
                    {
                        if (rgLabelVals[l] != nLabel)
                            rgrgLabelSel[nLabel].Add(rgLabelVals[l]);
                    }
                }

                int nLabelIdx = rand.Next(rgrgLabelSel[nLabel].Count);
                int nLabelX = rgrgLabelSel[nLabel][nLabelIdx];
                rgrgLabelSel[nLabel].Remove(nLabelX);

                m_cuda.copy(nDim, tgt.gpu_data, tgtNeg.mutable_gpu_data, nLabelX * nDim, i * nDim);
            }
        }
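
        // For example (hypothetical values): with pregen_label_start = 0 and four
        // target centroids, a sample labeled 2 receives centroid 2 as its positive,
        // and one of centroids {0, 1, 3}, chosen at random without replacement
        // across the samples labeled 2, as its negative.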

        /// <summary>
        /// Computes the forward calculation.
        /// </summary>
        protected override void forward(BlobCollection<T> colBottom, BlobCollection<T> colTop)
        {
            m_log.CHECK_GE(colBottom.Count, 4, "The bottom must have at least 4 items: anchor, positives, negatives and label.");
            int nCount = colBottom[0].count();
            int nNum = colBottom[0].num;
            int nDim = colBottom[0].count(1);
            long hAnchor = colBottom[0].gpu_data;
            long hPositive = colBottom[1].gpu_data;
            long hNegative = colBottom[2].gpu_data;

            m_blobWork.Reshape(nNum, 1, 1, 1);

            m_log.CHECK_EQ(colBottom.Count, 4, "Currently, external targets such as centroids are not supported.");
            //if (colBottom.Count == 5)
            //    loadPreGenTargets(colBottom[3], colBottom[4], m_blobPreGenTargetsNeg, m_blobPreGenTargetsPos);

            m_cuda.sub(nCount, hAnchor, hPositive, m_blobDiffAP.mutable_gpu_data); // a_i - p_i
            m_cuda.sub(nCount, hAnchor, hNegative, m_blobDiffAN.mutable_gpu_data); // a_i - n_i

            m_cuda.powx(nCount, m_blobDiffAP.gpu_data, 2.0, m_blobDiffSqAP.mutable_gpu_data); // (a_i - p_i)^2
            m_cuda.gemv(false, nNum, nDim, 1.0, m_blobDiffSqAP.gpu_data, m_blobSumVec.gpu_data, 0.0, m_blobDistSqAP.mutable_gpu_data); // \Sum (a_i - p_i)^2

            m_cuda.powx(nCount, m_blobDiffAN.gpu_data, 2.0, m_blobDiffSqAN.mutable_gpu_data); // (a_i - n_i)^2
            m_cuda.gemv(false, nNum, nDim, 1.0, m_blobDiffSqAN.gpu_data, m_blobSumVec.gpu_data, 0.0, m_blobDistSqAN.mutable_gpu_data); // \Sum (a_i - n_i)^2

            double dfMargin = m_dfAlpha;

            m_cuda.sub(nNum, m_blobDistSqAP.gpu_data, m_blobDistSqAN.gpu_data, m_blobWork.mutable_gpu_data);
            m_cuda.add_scalar(nNum, dfMargin, m_blobWork.mutable_gpu_data);
            m_cuda.set_bounds(nNum, 0, float.MaxValue, m_blobWork.mutable_gpu_data);
            m_cuda.copy_expand(nCount, nNum, nDim, m_blobWork.gpu_data, m_blobLossVec.mutable_gpu_data);
            m_cuda.sign(nCount, m_blobLossVec.gpu_data, m_blobLossVec.mutable_gpu_data);

            double dfLoss = m_cuda.asum_double(nNum, m_blobWork.gpu_data);
            dfLoss /= (nNum * 2.0);
            colTop[0].SetData(dfLoss, 0);
        }
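
        // In scalar form, the forward pass above computes:
        //
        //   loss = (1 / (2 * N)) * SUM_i max(0, ||a_i - p_i||^2 - ||a_i - n_i||^2 + alpha)
        //
        // where N is the batch size and alpha is the margin. m_blobLossVec ends up
        // holding the 0/1 active-triplet indicator expanded to every element, which
        // the backward pass uses to mask out triplets that incur no loss.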

        /// <summary>
        /// Computes the error gradient w.r.t. the inputs.
        /// </summary>
        protected override void backward(BlobCollection<T> colTop, List<bool> rgbPropagateDown, BlobCollection<T> colBottom)
        {
            int nCount = colBottom[0].count();
            int nNum = colBottom[0].num;
            double dfDiff = convertD(colTop[0].GetDiff(0));
            double dfAlpha = dfDiff / (double)nNum;
            long hAnchor = colBottom[0].gpu_data;
            long hPositive = colBottom[1].gpu_data;
            long hNegative = colBottom[2].gpu_data;

            m_blobLossVec.scale_data(dfAlpha);

            if (rgbPropagateDown[0])
            {
                m_cuda.sub(nCount, hNegative, hPositive, m_blobDiffPN.mutable_gpu_diff);
                m_cuda.mul(nCount, m_blobLossVec.gpu_data, m_blobDiffPN.gpu_diff, colBottom[0].mutable_gpu_diff);
            }

            if (rgbPropagateDown[1])
            {
                m_cuda.sub(nCount, hPositive, hAnchor, m_blobDiffAP.mutable_gpu_diff);
                m_cuda.mul(nCount, m_blobLossVec.gpu_data, m_blobDiffAP.gpu_diff, colBottom[1].mutable_gpu_diff);
            }

            if (rgbPropagateDown[2])
            {
                m_cuda.sub(nCount, hAnchor, hNegative, m_blobDiffAN.mutable_gpu_diff);
                m_cuda.mul(nCount, m_blobLossVec.gpu_data, m_blobDiffAN.gpu_diff, colBottom[2].mutable_gpu_diff);
            }
        }
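
        // The updates above follow from differentiating the loss; the factor of 2
        // from the squared terms cancels the 1/2 in the normalization:
        //
        //   dL/da_i = m_i * (n_i - p_i) / N   (anchor)
        //   dL/dp_i = m_i * (p_i - a_i) / N   (positive)
        //   dL/dn_i = m_i * (a_i - n_i) / N   (negative)
        //
        // where m_i is 1 for triplets with a positive loss and 0 otherwise, and
        // the top diff scales all three terms.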
    }
}
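A minimal usage sketch follows (an assumption-laden illustration, not code from this file): it assumes the general MyCaffe pattern of creating a layer through Layer<float>.Create with a null cancel event, and the blobs blobAnchor, blobPositive, blobNegative, blobLabel, and blobLoss are hypothetical, pre-shaped inputs and output.

    LayerParameter p = new LayerParameter(LayerParameter.LayerType.TRIPLET_LOSS);
    p.triplet_loss_param.alpha = 0.5; // the margin between positive and negative distances.

    Layer<float> layer = Layer<float>.Create(cuda, log, p, null);

    BlobCollection<float> colBottom = new BlobCollection<float>();
    colBottom.Add(blobAnchor);   // bottom[0]: anchor encodings.
    colBottom.Add(blobPositive); // bottom[1]: positive (same label) encodings.
    colBottom.Add(blobNegative); // bottom[2]: negative (different label) encodings.
    colBottom.Add(blobLabel);    // bottom[3]: labels.

    BlobCollection<float> colTop = new BlobCollection<float>();
    colTop.Add(blobLoss);        // top[0]: scalar loss.

    layer.Setup(colBottom, colTop);
    layer.Forward(colBottom, colTop);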
The Log class provides general output in text form.
Definition: Log.cs:13
void CHECK(bool b, string str)
Test a flag for true.
Definition: Log.cs:227
void CHECK_EQ(double df1, double df2, string str)
Test whether one number is equal to another.
Definition: Log.cs:239
void CHECK_GE(double df1, double df2, string str)
Test whether one number is greater than or equal to another.
Definition: Log.cs:287
The Utility class provides general utility functions.
Definition: Utility.cs:35
The BlobCollection contains a list of Blobs.
void Add(Blob< T > b)
Add a new Blob to the collection.
void SetData(double df)
Set all blob data to the value specified.
int Count
Returns the number of items in the collection.
void Reshape(int[] rgShape)
Reshapes all blobs in the collection to the given shape.
The Blob is the main holder of data that moves through the Layers of the Net.
Definition: Blob.cs:25
void SetData(T[] rgData, int nCount=-1, bool bSetCount=true)
Sets a number of items within the Blob's data.
Definition: Blob.cs:1922
long mutable_gpu_diff
Returns the diff GPU handle used by the CudaDnn connection.
Definition: Blob.cs:1555
long mutable_gpu_data
Returns the data GPU handle used by the CudaDnn connection.
Definition: Blob.cs:1487
void Reshape(int nNum, int nChannels, int nHeight, int nWidth, bool? bUseHalfSize=null)
DEPRECATED; use
Definition: Blob.cs:442
void scale_data(double df)
Scale the data by a scaling factor.
Definition: Blob.cs:1754
T[] update_cpu_data()
Update the CPU data by transferring the GPU data over to the Host.
Definition: Blob.cs:1470
int count()
Returns the total number of items in the Blob.
Definition: Blob.cs:739
void ReshapeLike(Blob< T > b, bool? bUseHalfSize=null)
Reshape this Blob to have the same shape as another Blob.
Definition: Blob.cs:648
string Name
Get/set the name of the Blob.
Definition: Blob.cs:2184
long gpu_diff
Returns the diff GPU handle used by the CudaDnn connection.
Definition: Blob.cs:1541
virtual void Dispose(bool bDisposing)
Releases all resources used by the Blob (including both GPU and Host).
Definition: Blob.cs:402
int num
DEPRECATED; legacy shape accessor num: use shape(0) instead.
Definition: Blob.cs:792
long gpu_data
Returns the data GPU handle used by the CudaDnn connection.
Definition: Blob.cs:1479
The CudaDnn object is the main interface to the Low-Level Cuda C++ DLL.
Definition: CudaDnn.cs:969
Log m_log
Specifies the Log for output.
Definition: Layer.cs:43
LayerParameter m_param
Specifies the LayerParameter describing the Layer.
Definition: Layer.cs:47
float convertF(T df)
Converts a generic to a float value.
Definition: Layer.cs:1359
double convertD(T df)
Converts a generic to a double value.
Definition: Layer.cs:1349
CudaDnn< T > m_cuda
Specifies the CudaDnn connection to Cuda.
Definition: Layer.cs:39
LayerParameter.LayerType m_type
Specifies the Layer type.
Definition: Layer.cs:35
The LossLayer provides an interface for Layer's that take two blobs as input – usually (1) prediction...
Definition: LossLayer.cs:23
TripletLoss Layer - this is the triplet loss layer used to calculate the triplet loss and gradients u...
override void backward(BlobCollection< T > colTop, List< bool > rgbPropagateDown, BlobCollection< T > colBottom)
Computes the error gradient w.r.t the inputs.
TripletLossLayer(CudaDnn< T > cuda, Log log, LayerParameter p)
The TripletLossLayer constructor.
override void LayerSetUp(BlobCollection< T > colBottom, BlobCollection< T > colTop)
Setup the layer.
override int ExactNumBottomBlobs
Returns the exact number of bottom blobs which are variable so -1 is returned.
override int MinBottomBlobs
Returns the minimum number of bottom blobs: anchor, positive, negative, label
override void Reshape(BlobCollection< T > colBottom, BlobCollection< T > colTop)
Reshape the bottom (input) and top (output) blobs.
override bool AllowForceBackward(int nBottomIdx)
Returns true for all but the labels, since we want the loss value to be propagated back.
override void setup_internal_blobs(BlobCollection< T > col)
Derived layers should add all internal blobs to the 'col' provided.
override int MaxBottomBlobs
Returns the maximum number of bottom blobs: anchor, positive, negative, label, centroids (from decode...
override void forward(BlobCollection< T > colBottom, BlobCollection< T > colTop)
Computes the forward calculation.
override int ExactNumTopBlobs
Returns the exact number of required top (output) Blobs: loss
void loadPreGenTargets(Blob< T > lbl, Blob< T > tgt, Blob< T > tgtNeg, Blob< T > tgtPos)
Loads the pre-gen targets, only made public for testing.
override void dispose()
Releases all GPU and host resources used by the Layer.
Specifies the base parameter for all layers.
string name
Specifies the name of this LayerParameter.
TripletLossParameter triplet_loss_param
Returns the parameter set when initialized with LayerType.TRIPLET_LOSS
LayerType
Specifies the layer type.
The MyCaffe.basecode contains all generic types used throughout MyCaffe.
Definition: Annotation.cs:12
The MyCaffe.common namespace contains common MyCaffe classes.
Definition: BatchInput.cs:8
The MyCaffe.layers.beta namespace contains all beta stage layers.
Definition: LayerFactory.cs:9
The MyCaffe.param namespace contains parameters used to create models.
The MyCaffe namespace contains the main body of MyCaffe code that closely tracks the C++ Caffe open-...
Definition: Annotation.cs:12