MyCaffe  1.12.2.41
Deep learning software for Windows C# programmers.
AccuracyEncodingLayer.cs
1using System;
2using System.Collections.Generic;
3using System.Linq;
4using System.Text;
5using MyCaffe.basecode;
6using MyCaffe.common;
7using MyCaffe.param;
8
10{
18 public class AccuracyEncodingLayer<T> : Layer<T>
19 {
int m_nCacheSize = 100;     // Items accumulated per label before the running centroid average saturates (set from decode_param.cache_size in LayerSetUp).
int m_nNum = 0;             // Batch size (num of bottom[0]) recorded at the last Reshape.
int m_nEncodingDim = 0;     // Embedding dimension (channels of bottom[0]) recorded at the last Reshape.
Blob<T> m_blobEncodings;    // Internal work blob for encodings.
Blob<T> m_blobData;         // Current embedding replicated across each label 'slot' (num = label count).
Blob<T> m_blobDistSq;       // Per-label squared distance of the current embedding to each centroid.
Blob<T> m_blobSummerVec;    // Vector of ones used to sum squared differences along the channel axis.
Dictionary<int, int> m_rgLabelCounts = new Dictionary<int, int>();  // Per-label count of items folded into its centroid.
28
/// <summary>
/// Constructor.
/// </summary>
/// <param name="cuda">Specifies the CudaDnn connection to Cuda.</param>
/// <param name="log">Specifies the Log for output.</param>
/// <param name="p">Specifies the LayerParameter initialized with LayerType.ACCURACY_ENCODING.</param>
/// <remarks>
/// NOTE(review): the constructor signature line was missing from the extracted listing;
/// it is restored here from the file's declaration index
/// (AccuracyEncodingLayer(CudaDnn&lt;T&gt; cuda, Log log, LayerParameter p)) — confirm against the repository.
/// </remarks>
public AccuracyEncodingLayer(CudaDnn<T> cuda, Log log, LayerParameter p)
    : base(cuda, log, p)
{
    m_type = LayerParameter.LayerType.ACCURACY_ENCODING;

    // Internal work blobs; names derive from the layer name for easier debugging.
    m_blobEncodings = new Blob<T>(cuda, log);
    m_blobEncodings.Name = m_param.name + " encodings";
    m_blobDistSq = new Blob<T>(cuda, log, false);    // 'false' = no diff memory needed.
    m_blobDistSq.Name = m_param.name + " distsq";
    m_blobSummerVec = new Blob<T>(cuda, log, false); // 'false' = no diff memory needed.
    m_blobSummerVec.Name = m_param.name + " sum";
    m_blobData = new Blob<T>(cuda, log);
    m_blobData.Name = m_param.name + " data";
}
53
/// <summary>
/// Releases all GPU and host resources used by the Layer.
/// </summary>
protected override void dispose()
{
    // Free the internal work blobs (order is immaterial — they are independent),
    // then let the base class release its own resources.
    dispose(ref m_blobData);
    dispose(ref m_blobSummerVec);
    dispose(ref m_blobDistSq);
    dispose(ref m_blobEncodings);

    base.dispose();
}
64
/// <summary>
/// Registers the layer's internal work blobs with the provided collection.
/// </summary>
/// <param name="col">Specifies the collection that receives the internal blobs.</param>
protected override void setup_internal_blobs(BlobCollection<T> col)
{
    // A non-empty collection means registration already happened — do it only once.
    if (col.Count != 0)
        return;

    col.Add(m_blobEncodings);
    col.Add(m_blobDistSq);
    col.Add(m_blobSummerVec);
    col.Add(m_blobData);
}
76
/// <summary>
/// Returns the number of bottom blobs used: predicted, label.
/// </summary>
public override int ExactNumBottomBlobs
{
    get { return 2; }
}
84
/// <summary>
/// Returns the number of top blobs: accuracy.
/// </summary>
public override int ExactNumTopBlobs
{
    get { return 1; }
}
92
/// <summary>
/// Setup the layer: validate the accuracy parameters, read the cache size, and create the
/// learnable centroid blob when it does not already exist.
/// </summary>
/// <param name="colBottom">Specifies the bottom blobs: bottom[0] = embeddings, bottom[1] = labels.</param>
/// <param name="colTop">Specifies the top blob: top[0] = scalar accuracy.</param>
public override void LayerSetUp(BlobCollection<T> colBottom, BlobCollection<T> colTop)
{
    m_log.CHECK_EQ((int)m_param.accuracy_param.top_k, 1, "Accuracy Encoding Layer only supports a topk = 1.");
    m_log.CHECK_EQ((int)m_param.accuracy_param.axis, 1, "Accuracy Encoding Layer expects axis to = 1.");

    // FIX: only warn when the user actually configured ignore labels.  The extracted
    // listing emitted this warning unconditionally; the guard line appears to have been
    // dropped during extraction (accuracy_param declares 'List<int> ignore_labels').
    if (m_param.accuracy_param.ignore_labels.Count > 0)
        m_log.WriteLine("WARNING: The Accuracy Encoding Layer does not use the 'ignore_label' parameter.");

    m_nCacheSize = m_param.decode_param.cache_size;
    m_log.CHECK_GT(m_nCacheSize, 0, "The cache size must be > 0.");

    if (m_colBlobs.Count == 0)
    {
        Blob<T> blobCentroids = new Blob<T>(m_cuda, m_log, false);
        blobCentroids.Name = m_param.name + " centroids";
        blobCentroids.reshape_when_sharing = true;

        List<int> rgCentroidShape = new List<int>() { 0 }; // skip size check.
        if (!shareParameter(blobCentroids, rgCentroidShape))
        {
            // NOTE(review): m_nEncodingDim is still 0 at setup time (it is assigned in
            // Reshape); forward() re-shapes the centroid blob once the real embedding
            // dimension is known, so this initial shape is only a placeholder.
            blobCentroids.Reshape(2, m_nEncodingDim, 1, 1); // at least two labels initially (may get expanded in forward).
            blobCentroids.SetData(0);
        }

        m_colBlobs.Add(blobCentroids);
    }
}
125
/// <summary>
/// Reshape the bottom (input) and top (output) blobs.
/// </summary>
/// <param name="colBottom">Specifies the bottom blobs: bottom[0] = embeddings, bottom[1] = labels.</param>
/// <param name="colTop">Specifies the top blob: top[0] = scalar accuracy.</param>
public override void Reshape(BlobCollection<T> colBottom, BlobCollection<T> colTop)
{
    // Cache the batch size and embedding dimension for use in forward().
    // (The original computed an unused local 'bFirstReshape' via the redundant
    // ternary '(nNum != m_nNum) ? true : false'; both removed.)
    m_nNum = colBottom[0].num;
    m_nEncodingDim = colBottom[0].channels;

    m_log.CHECK_EQ(colBottom[1].num, m_nNum, "The number of labels does not match the number of items at bottom[0].");

    List<int> rgTopShape = new List<int>(); // Accuracy is a scalar; 0 axes.
    colTop[0].Reshape(rgTopShape);
    colTop[0].type = BLOB_TYPE.ACCURACY;

    // Vector of ones used by forward() to sum squared differences along the channel axis.
    m_blobSummerVec.Reshape(colBottom[0].channels, 1, 1, 1);
    m_blobSummerVec.SetData(1.0);
}
148
/// <summary>
/// Forward computation: maintain a running centroid per label from the incoming
/// embeddings, classify each embedding by nearest centroid (smallest sum of squared
/// differences), and emit the batch accuracy at top[0].
/// </summary>
/// <param name="colBottom">bottom[0] = predicted embeddings (num x dim); bottom[1] = label pairs {lbl1, lbl2} — only lbl1 is used.</param>
/// <param name="colTop">top[0] = scalar accuracy.</param>
protected override void forward(BlobCollection<T> colBottom, BlobCollection<T> colTop)
{
    m_log.CHECK_EQ(colBottom[1].count() % 2, 0, "The bottom[1] count must be a factor of 2 for {lbl1, lbl2}.");
    int nItemNum = colBottom[0].num;
    int nItemCount = nItemNum * m_param.decode_param.cache_size;
    // Nominal per-item weight used once a label's cache is full (and to seed new centroids).
    double dfTotalAlpha = 1.0 / (double)nItemCount;

    double dfAccuracy = 0;
    double[] rgBottomLabel = convertD(colBottom[1].update_cpu_data());
    int nCorrectCount = 0;
    int nComparedCount = 0;

    // Expand the centroid storage whenever a label index larger than any seen so far arrives.
    int nMaxLabel = rgBottomLabel.Max(p => (int)p);
    int nMaxKey = (m_rgLabelCounts.Count == 0) ? 0 : m_rgLabelCounts.Max(p => p.Key);
    if (nMaxLabel > nMaxKey)
    {
        int nNumLabels = nMaxLabel + 1;

        m_colBlobs[0].Reshape(nNumLabels, m_nEncodingDim, 1, 1);
        m_colBlobs[0].SetData(0);
        m_blobData.Reshape(nNumLabels, m_nEncodingDim, 1, 1);
        m_blobDistSq.Reshape(nNumLabels, 1, 1, 1);
        m_rgLabelCounts.Clear(); // counts restart because the centroids were zeroed above.
    }

    for (int i = 0; i < colBottom[0].num; i++)
    {
        int nLabel = (int)rgBottomLabel[i * 2]; // Only the first label of each {lbl1, lbl2} pair is used.
        int nLabelItemCount = 0;

        if (m_rgLabelCounts.ContainsKey(nLabel))
            nLabelItemCount = m_rgLabelCounts[nLabel];

        if (nLabelItemCount == 0)
        {
            // First item for this label: seed the centroid with a copy of the embedding
            // scaled by the nominal weight.
            m_cuda.copy(m_nEncodingDim, colBottom[0].gpu_data, m_colBlobs[0].mutable_gpu_data, i * m_nEncodingDim, nLabel * m_nEncodingDim);
            m_cuda.scale(m_nEncodingDim, convert(dfTotalAlpha), m_colBlobs[0].gpu_data, m_colBlobs[0].mutable_gpu_data, nLabel * m_nEncodingDim, nLabel * m_nEncodingDim);
        }
        else if (nLabelItemCount < nItemCount)
        {
            // Warm-up: running average, weighting the new item by 1/(n+1).
            double dfAlpha = 1.0 / (nLabelItemCount + 1);
            m_cuda.add(m_nEncodingDim, colBottom[0].gpu_data, m_colBlobs[0].gpu_data, m_colBlobs[0].mutable_gpu_data, dfAlpha, 1.0 - dfAlpha, i * m_nEncodingDim, nLabel * m_nEncodingDim, nLabel * m_nEncodingDim);
        }
        else
        {
            // Saturated: exponential moving average with the nominal weight.
            // BUG FIX: the original reused whatever 'dfAlpha' was last assigned — possibly
            // the warm-up alpha of a *different* label from an earlier iteration — instead
            // of the intended nominal weight 1/nItemCount; use it explicitly here.
            m_cuda.add(m_nEncodingDim, colBottom[0].gpu_data, m_colBlobs[0].gpu_data, m_colBlobs[0].mutable_gpu_data, dfTotalAlpha, 1.0 - dfTotalAlpha, i * m_nEncodingDim, nLabel * m_nEncodingDim, nLabel * m_nEncodingDim);
        }

        m_colBlobs[0].snapshot_requested = true;

        if (!m_rgLabelCounts.ContainsKey(nLabel))
            m_rgLabelCounts.Add(nLabel, 1);
        else
            m_rgLabelCounts[nLabel]++;

        // Replicate the current embedding across each label 'slot' of blobData so the
        // distance to every centroid can be computed in one pass.
        int nCount = m_blobData.count();
        int nItems = m_blobData.num;
        m_cuda.fill(nItems, m_nEncodingDim, colBottom[0].gpu_data, i * m_nEncodingDim, nCount, m_blobData.mutable_gpu_data);

        // Squared distance to every centroid: per-label sum over channels of (a_i - b_i)^2.
        m_cuda.sub(nCount,
            m_blobData.gpu_data,            // a
            m_colBlobs[0].gpu_data,         // b (centroids)
            m_blobData.mutable_gpu_diff);   // a_i - b_i

        m_cuda.powx(nCount,
            m_blobData.gpu_diff,            // a_i - b_i
            2.0,
            m_blobData.mutable_gpu_diff);   // (a_i - b_i)^2

        m_cuda.gemv(false,
            m_blobData.num,                 // label count.
            m_blobData.channels,            // encoding size.
            1.0,
            m_blobData.gpu_diff,            // (a_i - b_i)^2
            m_blobSummerVec.gpu_data,       // ones vector: row-sum via gemv.
            0.0,
            m_blobDistSq.mutable_gpu_data); // \Sum (a_i - b_i)^2

        // The label with the smallest distance is the detected label.
        double[] rgLabelDist = convertD(m_blobDistSq.mutable_cpu_data);
        int nDetectedLabel = -1;
        double dfMin = double.MaxValue;

        for (int l = 0; l < rgLabelDist.Length; l++)
        {
            if (rgLabelDist[l] < dfMin)
            {
                dfMin = rgLabelDist[l];
                nDetectedLabel = l;
            }
        }

        if (nDetectedLabel == nLabel)
            nCorrectCount++;

        nComparedCount++;
    }

    dfAccuracy = (nComparedCount == 0) ? 0 : (double)nCorrectCount / nComparedCount;

    colTop[0].SetData(dfAccuracy, 0);
    colTop[0].Tag = m_param.accuracy_param.top_k;
}
277
/// <summary>
/// Not implemented — the AccuracyEncodingLayer cannot be used as a loss, so no
/// gradient is propagated.
/// </summary>
protected override void backward(BlobCollection<T> colTop, List<bool> rgbPropagateDown, BlobCollection<T> colBottom)
{
    // Intentionally a no-op.
}
283 }
284}
The Log class provides general output in text form.
Definition: Log.cs:13
void WriteLine(string str, bool bOverrideEnabled=false, bool bHeader=false, bool bError=false, bool bDisable=false)
Write a line of output.
Definition: Log.cs:80
void CHECK_EQ(double df1, double df2, string str)
Test whether one number is equal to another.
Definition: Log.cs:239
void CHECK_GT(double df1, double df2, string str)
Test whether one number is greater than another.
Definition: Log.cs:299
The BlobCollection contains a list of Blobs.
void Add(Blob< T > b)
Add a new Blob to the collection.
void SetData(double df)
Set all blob data to the value specified.
int Count
Returns the number of items in the collection.
void Reshape(int[] rgShape)
Reshapes all blobs in the collection to the given shape.
The Blob is the main holder of data that moves through the Layers of the Net.
Definition: Blob.cs:25
int channels
DEPRECATED; legacy shape accessor channels: use shape(1) instead.
Definition: Blob.cs:800
void SetData(T[] rgData, int nCount=-1, bool bSetCount=true)
Sets a number of items within the Blob's data.
Definition: Blob.cs:1922
long mutable_gpu_diff
Returns the diff GPU handle used by the CudaDnn connection.
Definition: Blob.cs:1555
long mutable_gpu_data
Returns the data GPU handle used by the CudaDnn connection.
Definition: Blob.cs:1487
T[] mutable_cpu_data
Get data from the GPU and bring it over to the host, or Set data from the Host and send it over to th...
Definition: Blob.cs:1461
void Reshape(int nNum, int nChannels, int nHeight, int nWidth, bool? bUseHalfSize=null)
DEPRECATED; use
Definition: Blob.cs:442
bool reshape_when_sharing
When true, this Blob is reshaped to the source when sharing the source data (default = false).
Definition: Blob.cs:1803
int count()
Returns the total number of items in the Blob.
Definition: Blob.cs:739
string Name
Get/set the name of the Blob.
Definition: Blob.cs:2184
long gpu_diff
Returns the diff GPU handle used by the CudaDnn connection.
Definition: Blob.cs:1541
int num
DEPRECATED; legacy shape accessor num: use shape(0) instead.
Definition: Blob.cs:792
long gpu_data
Returns the data GPU handle used by the CudaDnn connection.
Definition: Blob.cs:1479
The CudaDnn object is the main interface to the Low-Level Cuda C++ DLL.
Definition: CudaDnn.cs:969
An interface for the units of computation which can be composed into a Net.
Definition: Layer.cs:31
Log m_log
Specifies the Log for output.
Definition: Layer.cs:43
LayerParameter m_param
Specifies the LayerParameter describing the Layer.
Definition: Layer.cs:47
void convert(BlobCollection< T > col)
Convert a collection of blobs from / to half size.
Definition: Layer.cs:535
bool shareParameter(Blob< T > b, List< int > rgMinShape, bool bAllowEndsWithComparison=false)
Attempts to share a parameter Blob if another parameter Blob with the same name and acceptable size i...
Definition: Layer.cs:1152
double convertD(T df)
Converts a generic to a double value.
Definition: Layer.cs:1349
CudaDnn< T > m_cuda
Specifies the CudaDnn connection to Cuda.
Definition: Layer.cs:39
LayerParameter.LayerType m_type
Specifies the Layer type.
Definition: Layer.cs:35
BlobCollection< T > m_colBlobs
Specifies the learnable parameter Blobs of the Layer.
Definition: Layer.cs:55
The AccuracyEncodingLayer computes the classification accuracy for an encoding used in a classificati...
override void forward(BlobCollection< T > colBottom, BlobCollection< T > colTop)
Forward compuation.
override void Reshape(BlobCollection< T > colBottom, BlobCollection< T > colTop)
Reshape the bottom (input) and top (output) blobs.
AccuracyEncodingLayer(CudaDnn< T > cuda, Log log, LayerParameter p)
Constructor.
override int ExactNumTopBlobs
Returns the number of top blobs: accuracy
override void dispose()
Releases all GPU and host resources used by the Layer.
override void setup_internal_blobs(BlobCollection< T > col)
Derivative layers should add all internal blobs to the 'col' provided.
override void backward(BlobCollection< T > colTop, List< bool > rgbPropagateDown, BlobCollection< T > colBottom)
Not implemented – the AccuracyEncodingLayer cannot be used as a loss.
override int ExactNumBottomBlobs
Returns the number of bottom blobs used: predicted, label
override void LayerSetUp(BlobCollection< T > colBottom, BlobCollection< T > colTop)
Setup the layer.
uint top_k
When computing accuracy, count as correct by comparing the true label to the top_k scoring classes....
List< int > ignore_labels
If specified, ignore instances with the given label(s).
int axis
The 'label' axis of the prediction blob, whos argmax corresponds to the predicted label – may be nega...
Specifies the base parameter for all layers.
string name
Specifies the name of this LayerParameter.
AccuracyParameter accuracy_param
Returns the parameter set when initialized with LayerType.ACCURACY
DecodeParameter decode_param
Returns the parameter set when initializing with LayerType.DECODE or LayerType.ACCURACY_ENCODING;
LayerType
Specifies the layer type.
The MyCaffe.basecode contains all generic types used throughout MyCaffe.
Definition: Annotation.cs:12
The MyCaffe.common namespace contains common MyCaffe classes.
Definition: BatchInput.cs:8
BLOB_TYPE
Defines the type of data held by a given Blob.
Definition: Interfaces.cs:62
The MyCaffe.layers.beta namespace contains all beta stage layers.
Definition: LayerFactory.cs:9
The MyCaffe.param namespace contains parameters used to create models.
The MyCaffe namespace contains the main body of MyCaffe code that closely tracks the C++ Caffe open-...
Definition: Annotation.cs:12