MyCaffe  1.12.2.41
Deep learning software for Windows C# programmers.
Blob.cs
1using System;
2using System.Collections.Generic;
3using System.Linq;
4using System.Text;
5using System.IO;
6using System.Threading;
7using System.Diagnostics;
8using System.Drawing;
9using MyCaffe.param;
10using MyCaffe.basecode;
11using System.Drawing.Text;
12
13namespace MyCaffe.common
14{
24 public class Blob<T> : IDisposable
25 {
        T m_tZero;                                          // Cached 0 in the base type T.
        T m_tMinusOne;                                      // Cached -1 in the base type T (used by Update).
        string m_strName = "";                              // Optional blob name, used to prefix error messages.
        CudaDnn<T> m_cuda;                                  // Low-level CUDA connection.
        Log m_log;                                          // Output log (may be null).
        bool m_bIncludeDiff = true;                         // When false, no diff (gradient) memory is allocated.
        bool m_bOwnData = true;                             // False when the data memory is shared from another blob.
        SyncedMemory<T> m_data = null;                      // GPU/CPU synchronized data memory.
        bool m_bOwnDiff = true;                             // False when the diff memory is shared from another blob.
        SyncedMemory<T> m_diff = null;                      // GPU/CPU synchronized diff (gradient) memory.
        bool m_bOwnShape = true;                            // False when the shape memory is shared from another blob.
        SyncedMemory<T> m_shape = null;                     // GPU-side copy of the shape values.
        int m_nCount = 0;                                   // Total item count (product of the shape dims).
        int m_nCapacity = 0;                                // Allocated capacity; Reshape reallocates only when count exceeds this.
        List<int> m_rgShape = new List<int>();              // Host-side copy of the shape.
        int m_nIdx = -1;
        BLOB_TYPE m_type = BLOB_TYPE.DATA;
        object m_tag = null;                                // User-defined value attached to the blob.
        bool m_bFreezeLearning = false;                     // When true, Update() is a no-op.
        bool m_bCpuDataReadyForPush = false;
        bool m_bReshapeWhenSharing = false;
        bool m_bSnapshotRequested = false;
        bool m_bPadded = false;                             // Informational padding flag (see Padded).
        Dictionary<string, double> m_rgParam = new Dictionary<string, double>();    // Named user parameters (see SetParameter/GetParameter).
        int[] m_rgShape1 = new int[4] { 1, 1, 1, 1 };       // Scratch 4-element shape reused by Reshape(n,c,h,w) to avoid allocations.

        /// <summary>
        /// Defines the maximum number of axes allowed on a blob shape.
        /// </summary>
        public const int MAX_BLOB_AXES = 32;
56
        /// <summary>
        /// The Blob constructor.
        /// </summary>
        /// <param name="cuda">Specifies the CudaDnn connection to Cuda.</param>
        /// <param name="log">Specifies the output log (may be null).</param>
        /// <param name="bIncludeDiff">Optionally, specifies whether or not to allocate diff (gradient) memory (default = true).</param>
        /// <param name="bUseHalfSize">Optionally, specifies to use half-size memory (only supported when T is float).</param>
        public Blob(CudaDnn<T> cuda, Log log, bool bIncludeDiff = true, bool bUseHalfSize = false)
        {
            // Half-size storage is only implemented for the float base type; silently
            // fall back to full size (with a warning) for all other types.
            if (bUseHalfSize && typeof(T) != typeof(float))
            {
                bUseHalfSize = false;

                if (log != null)
                    log.WriteLine("WARNING: Half sizes currently only supported with the 'float' base type - changing back to full size.");
            }

            m_tZero = Zero;
            m_tMinusOne = MinusOne;
            m_bIncludeDiff = bIncludeDiff;
            m_cuda = cuda;
            m_log = log;
            m_shape = new SyncedMemory<T>(m_cuda, m_log);
            m_data = new SyncedMemory<T>(m_cuda, m_log, 0, null, bUseHalfSize);

            if (m_bIncludeDiff)
                m_diff = new SyncedMemory<T>(m_cuda, m_log, 0, null, bUseHalfSize);
        }
85
86
        /// <summary>
        /// The Blob constructor that reshapes to (nNum, nChannels, nHeight, nWidth).
        /// </summary>
        /// <param name="cuda">Specifies the CudaDnn connection to Cuda.</param>
        /// <param name="log">Specifies the output log.</param>
        /// <param name="nNum">Specifies the number of items.</param>
        /// <param name="nChannels">Specifies the number of channels.</param>
        /// <param name="nHeight">Specifies the height.</param>
        /// <param name="nWidth">Specifies the width.</param>
        /// <param name="bIncludeDiff">Optionally, allocate diff memory (default = true).</param>
        /// <param name="bUseHalfSize">Optionally, use half-size memory (float only).</param>
        public Blob(CudaDnn<T> cuda, Log log, int nNum, int nChannels, int nHeight, int nWidth, bool bIncludeDiff = true, bool bUseHalfSize = false)
            : this(cuda, log, bIncludeDiff, bUseHalfSize)
        {
            // Capacity must be initialized before calling Reshape.
            m_nCapacity = 0;
            Reshape(nNum, nChannels, nHeight, nWidth);
        }

        /// <summary>
        /// The Blob constructor that reshapes to a given shape list.
        /// </summary>
        public Blob(CudaDnn<T> cuda, Log log, List<int> rgShape, bool bIncludeDiff = true, bool bUseHalfSize = false)
            : this(cuda, log, bIncludeDiff, bUseHalfSize)
        {
            // Capacity must be initialized before calling Reshape.
            m_nCapacity = 0;
            Reshape(rgShape);
        }

        /// <summary>
        /// The Blob constructor that reshapes to a given shape array.
        /// </summary>
        public Blob(CudaDnn<T> cuda, Log log, int[] rgShape, bool bIncludeDiff = true, bool bUseHalfSize = false)
            : this(cuda, log, bIncludeDiff, bUseHalfSize)
        {
            // Capacity must be initialized before calling Reshape.
            m_nCapacity = 0;
            Reshape(rgShape);
        }

        /// <summary>
        /// The Blob constructor that reshapes like another blob; diff memory is only
        /// allocated when the source blob has a diff.
        /// </summary>
        public Blob(CudaDnn<T> cuda, Log log, Blob<T> b, bool bUseHalfSize = false)
            : this(cuda, log, (b.m_diff != null) ? true : false, bUseHalfSize)
        {
            // Capacity must be initialized before calling Reshape.
            m_nCapacity = 0;
            ReshapeLike(b);
        }

        /// <summary>
        /// The Blob constructor that loads its shape (and optionally data) from a SimpleDatum.
        /// </summary>
        public Blob(CudaDnn<T> cuda, Log log, SimpleDatum d, bool bCopyData = false, bool bIncludeDiff = true, bool bUseHalfSize = false)
            : this(cuda, log, bIncludeDiff, bUseHalfSize)
        {
            SetData(d, true, bCopyData);
        }

        /// <summary>
        /// The Blob constructor that loads its shape, data and diff from a BlobProto.
        /// </summary>
        public Blob(CudaDnn<T> cuda, Log log, BlobProto bp, bool bUseHalfSize = false)
            : this(cuda, log, true, bUseHalfSize)
        {
            FromProto(bp);
        }

        /// <summary>
        /// The Blob constructor that creates a view over a sub-range of another blob's
        /// GPU data (and diff), sharing the underlying memory.
        /// </summary>
        /// <param name="blob">Specifies the blob whose GPU memory is shared.</param>
        /// <param name="lCount">Specifies the number of items in the view.</param>
        /// <param name="lOffset">Specifies the item offset of the view within the source memory.</param>
        public Blob(Blob<T> blob, long lCount, long lOffset)
            : this(blob.Cuda, blob.Log, blob.m_bIncludeDiff)
        {
            m_data.set_gpu_data(blob.gpu_data, lCount, lOffset);

            if (m_diff != null)
                m_diff.set_gpu_data(blob.gpu_diff, lCount, lOffset);
        }
196
201 public void Unsqueeze(int nNumAxes)
202 {
203 if (num_axes < 4)
204 {
205 List<int> rgShape = Utility.Clone<int>(shape());
206 for (int i = rgShape.Count; i < 4; i++)
207 {
208 rgShape.Add(1);
209 }
210
211 Reshape(rgShape);
212 }
213 }
214
220 public double? GetParameter(string strName)
221 {
222 if (m_rgParam.ContainsKey(strName))
223 return m_rgParam[strName];
224
225 return null;
226 }
227
233 public void SetParameter(string strName, double dfVal)
234 {
235 if (!m_rgParam.ContainsKey(strName))
236 m_rgParam.Add(strName, dfVal);
237 else
238 m_rgParam[strName] = dfVal;
239 }
240
245 public void CopyParameters(Blob<T> b)
246 {
247 foreach (KeyValuePair<string, double> kv in b.m_rgParam)
248 {
249 if (!m_rgParam.ContainsKey(kv.Key))
250 m_rgParam.Add(kv.Key, kv.Value);
251 else
252 m_rgParam[kv.Key] = kv.Value;
253 }
254 }
255
        /// <summary>
        /// Returns Zero (0) in the base type T.
        /// </summary>
        public static T Zero
        {
            get { return (T)Convert.ChangeType(0, typeof(T)); }
        }

        /// <summary>
        /// Returns One (1) in the base type T.
        /// </summary>
        public static T One
        {
            get { return (T)Convert.ChangeType(1, typeof(T)); }
        }

        /// <summary>
        /// Returns MinusOne (-1) in the base type T.
        /// </summary>
        public static T MinusOne
        {
            get { return (T)Convert.ChangeType(-1, typeof(T)); }
        }

        /// <summary>
        /// Get/set a flag marking the blob as padded.  The flag is only stored here;
        /// nothing in this class interprets it.
        /// </summary>
        public bool Padded
        {
            get { return m_bPadded; }
            set { m_bPadded = value; }
        }

        /// <summary>
        /// Returns the amount of work memory (in bytes) needed when converting between
        /// half and base sizes: one count for the data plus one count for the diff,
        /// each at the base type size.
        /// </summary>
        /// <param name="bUseHalfSize">Specifies whether the size is computed for half-size values.</param>
        public ulong GetConversionWorkSize(bool bUseHalfSize)
        {
            // (count (for data) + count (for diff)) * base type size
            return (ulong)count() * 2 * CudaDnn<T>.basetype_size(bUseHalfSize);
        }
298
        /// <summary>
        /// Converts this blob's memory to half size, using the supplied GPU work memory to
        /// stage the data and diff values across the reallocation.
        /// </summary>
        /// <param name="hWorkMem">Specifies a handle to GPU work memory.</param>
        /// <param name="lWorkSize">Specifies the size of the work memory (see GetConversionWorkSize).</param>
        /// <param name="bData">Specifies to convert the data.</param>
        /// <param name="bDiff">Specifies to convert the diff.</param>
        public void ConvertToHalf(long hWorkMem, ulong lWorkSize, bool bData, bool bDiff)
        {
            int nCount = count();
            ulong lSize = (ulong)nCount * 2 * CudaDnn<T>.basetype_size(true);

            // Guard against overflow of the size calculation.
            if ((long)lSize < 0)
                throw new Exception("Memory out of range!");

            if (lWorkSize < lSize)
                throw new Exception("Work memory is not large enough!");

            // Stage the data in the first half of the work buffer and the diff in the
            // second half (offset by nCount), converting on the way out.
            if (bData)
                m_cuda.copy(nCount, gpu_data, hWorkMem, 0, 0, -1, null, true);

            if (bDiff)
                m_cuda.copy(nCount, gpu_diff, hWorkMem, 0, nCount, -1, null, true);

            // Reallocate this blob's memory as half size.
            Reshape(shape(), true);

            // Copy the staged values back into the newly allocated half-size memory.
            if (bData)
                m_cuda.copy(nCount, hWorkMem, mutable_gpu_data, 0, 0, -1, true, null);

            if (bDiff)
                m_cuda.copy(nCount, hWorkMem, mutable_gpu_diff, nCount, 0, -1, true, null);
        }
331
        /// <summary>
        /// Converts this blob's memory back to the full base size, using the supplied GPU
        /// work memory to stage the data and diff values across the reallocation.
        /// </summary>
        /// <param name="hWorkMem">Specifies a handle to GPU work memory.</param>
        /// <param name="lWorkSize">Specifies the size of the work memory (see GetConversionWorkSize).</param>
        /// <param name="bData">Specifies to convert the data.</param>
        /// <param name="bDiff">Specifies to convert the diff.</param>
        public void ConvertToBase(long hWorkMem, ulong lWorkSize, bool bData, bool bDiff)
        {
            int nCount = count();
            ulong lSize = (ulong)nCount * 2 * CudaDnn<T>.basetype_size(false);

            // Guard against overflow of the size calculation.
            if ((long)lSize < 0)
                throw new Exception("Memory out of range!");

            if (lWorkSize < lSize)
                throw new Exception("Work memory is not large enough!");

            // Stage the data in the first half of the work buffer and the diff in the
            // second half (offset by nCount).
            if (bData)
                m_cuda.copy(nCount, gpu_data, hWorkMem, 0, 0, -1, null, false);

            if (bDiff)
                m_cuda.copy(nCount, gpu_diff, hWorkMem, 0, nCount, -1, null, false);

            // Reallocate this blob's memory at the full base size.
            Reshape(shape(), false);

            // Copy the staged values back into the newly allocated memory.
            if (bData)
                m_cuda.copy(nCount, hWorkMem, mutable_gpu_data, 0, 0, -1, false, null);

            if (bDiff)
                m_cuda.copy(nCount, hWorkMem, mutable_gpu_diff, nCount, 0, -1, false, null);
        }
364
        /// <summary>
        /// Returns whether or not this blob is currently using half-size memory.
        /// </summary>
        public bool HalfSize
        {
            get { return m_data.HalfSize; }
        }

        /// <summary>
        /// Get/set whether learning is frozen; when true, Update() skips applying the diff.
        /// </summary>
        public bool freeze_learning
        {
            get { return m_bFreezeLearning; }
            set { m_bFreezeLearning = value; }
        }
381
386 {
387 get { return m_cuda; }
388 }
389
        /// <summary>
        /// Returns the Log associated with this blob.
        /// </summary>
        public Log Log
        {
            get { return m_log; }
        }
397
402 protected virtual void Dispose(bool bDisposing)
403 {
404 if (m_diff != null)
405 {
406 if (m_bOwnDiff)
407 m_diff.Dispose();
408 m_diff = null;
409 }
410
411 if (m_data != null)
412 {
413 if (m_bOwnData)
414 m_data.Dispose();
415 m_data = null;
416 }
417
418 if (m_shape != null)
419 {
420 if (m_bOwnShape)
421 m_shape.Dispose();
422 m_shape = null;
423 }
424 }
425
429 public void Dispose()
430 {
431 Dispose(true);
432 }
433
        /// <summary>
        /// Change the dimensions of the blob to (nNum, nChannels, nHeight, nWidth),
        /// reallocating memory only when the new count exceeds the current capacity.
        /// </summary>
        /// <param name="nNum">Specifies the number of items.</param>
        /// <param name="nChannels">Specifies the number of channels.</param>
        /// <param name="nHeight">Specifies the height.</param>
        /// <param name="nWidth">Specifies the width.</param>
        /// <param name="bUseHalfSize">Optionally, convert the memory to/from half size.</param>
        public void Reshape(int nNum, int nChannels, int nHeight, int nWidth, bool? bUseHalfSize = null)
        {
            // Reuse the cached 4-element array to avoid an allocation on every reshape.
            m_rgShape1[0] = nNum;
            m_rgShape1[1] = nChannels;
            m_rgShape1[2] = nHeight;
            m_rgShape1[3] = nWidth;

            Reshape(m_rgShape1, bUseHalfSize);
        }

        /// <summary>
        /// Returns a string of the form '{d1, d2, ...}' describing a shape (used in error messages).
        /// </summary>
        private string toString(List<int> rgShape)
        {
            return toString(rgShape.ToArray());
        }
456
457 private string toString(int[] rgShape)
458 {
459 string str = "{";
460
461 for (int i = 0; i < rgShape.Length; i++)
462 {
463 str += rgShape[i].ToString();
464 str += ", ";
465 }
466
467 str = str.TrimEnd(' ', ',');
468 str += "}";
469
470 return str;
471 }
472
        /// <summary>
        /// Validates and applies a new shape (see reshapeShape(int[])).
        /// </summary>
        private void reshapeShape(List<int> rgShape)
        {
            reshapeShape(rgShape.ToArray());
        }

        /// <summary>
        /// Validates a new shape and updates the host shape list (m_rgShape), the total
        /// count (m_nCount) and the GPU shape memory (m_shape).  Does not touch the
        /// data/diff memories - that is handled by Reshape(int[]).
        /// </summary>
        /// <param name="rgShape">Specifies the new shape dimensions.</param>
        private void reshapeShape(int[] rgShape)
        {
            m_log.CHECK_LE(rgShape.Length, MAX_BLOB_AXES, "The number of axes cannot exceed " + MAX_BLOB_AXES.ToString());
            m_nCount = 1;

            m_rgShape = new List<int>();

            // Make sure the GPU-side shape memory can hold rgShape.Length items.
            if (m_shape == null)
                m_shape = new SyncedMemory<T>(m_cuda, m_log, rgShape.Length);
            else if (m_shape.Capacity < rgShape.Length)
                m_shape.Allocate(rgShape.Length);
            else if (m_shape.Count != rgShape.Length)
            {
                m_shape.Count = rgShape.Length;
                m_shape.ZeroAll();
            }

            if (rgShape.Length > 0)
            {
                T[] rgShapeData = m_shape.cpu_data;

                if (rgShapeData == null || rgShapeData.Length != rgShape.Length)
                {
                    rgShapeData = m_shape.update_cpu_data();

                    if (rgShapeData == null || rgShapeData.Length != rgShape.Length)
                        rgShapeData = new T[rgShape.Length];
                }

                // Tracks whether any shape value actually changed, so the GPU copy is
                // only rewritten when needed.
                bool bDirty = false;

                for (int i = 0; i < rgShape.Length; i++)
                {
                    // Negative dimensions are invalid.
                    if (rgShape[i] < 0)
                    {
                        string strBlobName = (!string.IsNullOrEmpty(m_strName)) ? "Blob '" + m_strName + "': " : "";
                        m_log.FAIL(strBlobName + "The shape value at " + i.ToString() + " of shape " + toString(rgShape) + " must be >= 0.");
                    }

                    // Guard against int overflow of the running count product.
                    if (m_nCount != 0)
                    {
                        if (rgShape[i] > int.MaxValue / m_nCount)
                        {
                            string strBlobName = (!string.IsNullOrEmpty(m_strName)) ? "Blob '" + m_strName + "': " : "";
                            m_log.FAIL(strBlobName + "The blob size at item " + i.ToString() + " of shape " + toString(rgShape) + " exceeds the maximum of " + (int.MaxValue / m_nCount).ToString() + "!");
                        }
                    }

                    m_nCount *= rgShape[i];
                    m_rgShape.Add(rgShape[i]);

                    // Compare against the value already stored in the shape memory.
                    int nShape = (int)(double)Convert.ChangeType(rgShapeData[i], typeof(double));

                    if (nShape != rgShape[i])
                    {
                        rgShapeData[i] = (T)Convert.ChangeType(rgShape[i], typeof(T));
                        bDirty = true;
                    }
                }

                // Push the updated shape values to the shape memory only when changed.
                if (bDirty)
                {
                    m_shape.mutable_cpu_data = rgShapeData;
                    m_shape.update_cpu_data();
                }
            }
        }
545
        /// <summary>
        /// Change the dimensions of the blob, allocating new memory if necessary.
        /// </summary>
        /// <param name="rgShape">Specifies the new shape dimensions.</param>
        /// <param name="bUseHalfSize">Optionally, convert the memory to/from half size.</param>
        public void Reshape(List<int> rgShape, bool? bUseHalfSize = null)
        {
            Reshape(rgShape.ToArray(), bUseHalfSize);
        }
566
        /// <summary>
        /// Change the dimensions of the blob.  Memory is reallocated only when the new
        /// count exceeds the current capacity or a half/full size change is requested;
        /// a reallocation disposes the old memory, so existing contents are not preserved
        /// across it.
        /// </summary>
        /// <param name="rgShape">Specifies the new shape dimensions.</param>
        /// <param name="bUseHalfSize">Optionally, convert the memory to/from half size.</param>
        public void Reshape(int[] rgShape, bool? bUseHalfSize = null)
        {
            // Validate the shape and update m_rgShape / m_nCount / m_shape.
            reshapeShape(rgShape);

            // Reallocate only when capacity is exceeded or the half-size mode changes.
            if (m_nCount > m_nCapacity || (m_data != null && m_nCount > m_data.Capacity) || (m_diff != null && m_nCount > m_diff.Capacity) || (m_data != null && bUseHalfSize.HasValue && m_data.HalfSize != bUseHalfSize.Value))
            {
                if (m_data != null)
                    m_data.Dispose();

                if (m_diff != null)
                    m_diff.Dispose();

                m_nCapacity = m_nCount;

                if (m_data == null)
                    m_data = new SyncedMemory<T>(m_cuda, m_log, m_nCapacity, null, bUseHalfSize.GetValueOrDefault(false));
                else
                    m_data.Allocate(m_nCapacity, bUseHalfSize.GetValueOrDefault(m_data.HalfSize));

                if (m_bIncludeDiff)
                {
                    if (m_diff == null)
                        m_diff = new SyncedMemory<T>(m_cuda, m_log, m_nCapacity, null, bUseHalfSize.GetValueOrDefault(false));
                    else
                        m_diff.Allocate(m_nCapacity, bUseHalfSize.GetValueOrDefault(m_data.HalfSize));
                }
            }

            // The logical count may change (e.g. shrink) without a reallocation.
            if (m_data.Count != m_nCount)
                m_data.Count = m_nCount;

            if (m_bIncludeDiff)
            {
                if (m_diff.Count != m_nCount)
                    m_diff.Count = m_nCount;
            }
        }
620
        /// <summary>
        /// Change the dimensions of the blob to those of a BlobShape.
        /// </summary>
        /// <param name="shape">Specifies the new shape.</param>
        /// <param name="bUseHalfSize">Optionally, convert the memory to/from half size.</param>
        public void Reshape(BlobShape shape, bool? bUseHalfSize = null)
        {
            m_log.CHECK_LE(shape.dim.Count, MAX_BLOB_AXES, "The shape dimension must be less than " + MAX_BLOB_AXES.ToString());
            Reshape(shape.dim, bUseHalfSize);
        }

        /// <summary>
        /// Reshape this blob to have the same dimensions as another blob.
        /// </summary>
        /// <param name="b">Specifies the blob whose shape is copied.</param>
        /// <param name="bUseHalfSize">Optionally, convert the memory to/from half size.</param>
        public void ReshapeLike(Blob<T> b, bool? bUseHalfSize = null)
        {
            Reshape(b.shape(), bUseHalfSize);
        }
652
656 public string shape_string
657 {
658 get
659 {
660 string strOut = "";
661
662 for (int i = 0; i < m_rgShape.Count; i++)
663 {
664 strOut += m_rgShape[i].ToString() + " ";
665 }
666
667 strOut += "(" + m_rgShape.Count.ToString() + ")";
668 return strOut;
669 }
670 }
671
        /// <summary>
        /// Returns whether or not diff (gradient) memory was allocated for this blob.
        /// </summary>
        public bool DiffExists
        {
            get { return m_bIncludeDiff; }
        }

        /// <summary>
        /// Returns the host-side list of blob dimensions.  Note: the live internal list
        /// is returned, not a copy.
        /// </summary>
        public List<int> shape()
        {
            return m_rgShape;
        }

        /// <summary>
        /// Returns the dimension at a given axis; negative indexes count from the end
        /// (see CanonicalAxisIndex).
        /// </summary>
        /// <param name="nIdx">Specifies the axis index.</param>
        public int shape(int nIdx)
        {
            return m_rgShape[CanonicalAxisIndex(nIdx)];
        }

        /// <summary>
        /// Returns the number of axes in the blob shape.
        /// </summary>
        public int num_axes
        {
            get
            {
                return m_rgShape.Count;
            }
        }
711
715 public int num_true_axes
716 {
717 get
718 {
719 int nCount = 0;
720 bool bCount = false;
721
722 for (int i = m_rgShape.Count - 1; i >= 0; i--)
723 {
724 if (bCount || m_rgShape[i] != 1)
725 {
726 nCount++;
727 bCount = true;
728 }
729 }
730
731 return nCount;
732 }
733 }
734
        /// <summary>
        /// Returns the total number of items in the blob (the product of all shape dims).
        /// </summary>
        public int count()
        {
            return m_nCount;
        }

        /// <summary>
        /// Returns the number of items within a half-open axis range [nStartIdx, nEndIdx).
        /// </summary>
        /// <param name="nStartIdx">Specifies the first axis counted.</param>
        /// <param name="nEndIdx">Specifies the axis after the last one counted.</param>
        public int count(int nStartIdx, int nEndIdx)
        {
            m_log.CHECK_LE(nStartIdx, nEndIdx, "The start idx must be <= the end idx.");
            m_log.CHECK_GE(nStartIdx, 0, "The start idx must be >= 0.");
            m_log.CHECK_GE(nEndIdx, 0, "The end idx must be >= 0.");
            m_log.CHECK_LE(nStartIdx, num_axes, "The start axis must be <= the number of axes.");
            m_log.CHECK_LE(nEndIdx, num_axes, "The end axis must be <= the number of axes.");

            return Utility.Count(shape(), nStartIdx, nEndIdx);
        }

        /// <summary>
        /// Returns the number of items from a starting axis through the last axis.
        /// </summary>
        /// <param name="nStartIdx">Specifies the first axis counted.</param>
        public int count(int nStartIdx)
        {
            return count(nStartIdx, num_axes);
        }

        /// <summary>
        /// Converts a possibly negative axis index into the equivalent non-negative index
        /// (e.g. -1 maps to the last axis), failing when out of range.
        /// </summary>
        /// <param name="nIdx">Specifies the axis index, in [-num_axes, num_axes).</param>
        public int CanonicalAxisIndex(int nIdx)
        {
            m_log.CHECK_GE(nIdx, -num_axes, "The axis " + nIdx.ToString() + " out of range for " + num_axes.ToString() + " -D Blob with shape " + shape_string);
            m_log.CHECK_LT(nIdx, num_axes, "The axis " + nIdx.ToString() + " out of range for " + num_axes.ToString() + " -D Blob with shape " + shape_string);

            return Utility.CanonicalAxisIndex(nIdx, num_axes);
        }
787
        /// <summary>
        /// Returns the number of items (axis 0) using the legacy 4-axis accessors.
        /// </summary>
        public int num
        {
            get { return LegacyShape(0); }
        }

        /// <summary>
        /// Returns the number of channels (axis 1) using the legacy 4-axis accessors.
        /// </summary>
        public int channels
        {
            get { return LegacyShape(1); }
        }

        /// <summary>
        /// Returns the height (axis 2) using the legacy 4-axis accessors.
        /// </summary>
        public int height
        {
            get { return LegacyShape(2); }
        }

        /// <summary>
        /// Returns the width (axis 3) using the legacy 4-axis accessors.
        /// </summary>
        public int width
        {
            get { return LegacyShape(3); }
        }

        /// <summary>
        /// Returns the legacy (4-axis) dimension at an index, treating missing trailing
        /// axes as size 1.
        /// </summary>
        /// <param name="nIdx">Specifies the axis index in [-4, 4).</param>
        public int LegacyShape(int nIdx)
        {
            m_log.CHECK_LE(num_axes, 4, "Cannot use legacy accessors on Blobs with > 4 axes.");
            m_log.CHECK_LT(nIdx, 4, "The index must be less than 4.");
            m_log.CHECK_GE(nIdx, -4, "The index must be greater than or equal to -4.");

            if (nIdx >= num_axes || nIdx < -num_axes)
            {
                // Axis is out of range, but still in [0,3] or [-4,-1] for reverse
                // indexing) -- this special case simulates the one-padding used to fill
                // extraneous axes of legacy blobs.
                return 1;
            }

            return shape(nIdx);
        }
841
850 public int offset(int n, int c = 0, int h = 0, int w = 0)
851 {
852 int c1 = channels;
853 int h1 = height;
854 int w1 = width;
855
856 m_log.CHECK_GE(n, 0, "n must be >= 0.");
857 m_log.CHECK_LE(n, num, "n must be <= num.");
858 m_log.CHECK_GE(c1, 0, "channels must be >= 0.");
859 m_log.CHECK_LE(c, c1, "c must be <= channels.");
860 m_log.CHECK_GE(h1, 0, "height must be >= 0.");
861 m_log.CHECK_LE(h, h1, "w must be <= height.");
862 m_log.CHECK_GE(w1, 0, "width must be >= 0.");
863 m_log.CHECK_LE(w, w1, "w must be <= width.");
864
865 return ((n * c1 + c) * h1 + h) * w1 + w;
866 }
867
        /// <summary>
        /// Returns the flat offset of the item at a multi-axis index.  Missing trailing
        /// indexes are treated as 0.
        /// </summary>
        /// <param name="rgIdx">Specifies the index, one entry per axis (may be shorter than num_axes).</param>
        public int offset(List<int> rgIdx)
        {
            m_log.CHECK_LE(rgIdx.Count, num_axes, "The index array must have an item count <= num_axes.");

            int nOffset = 0;

            // Horner-style accumulation across the axes.
            for (int i = 0; i < num_axes; i++)
            {
                nOffset *= shape(i);

                if (rgIdx.Count > i)
                {
                    m_log.CHECK_GE(rgIdx[i], 0, "The index at " + i.ToString() + " must be >= 0.");
                    m_log.CHECK_LT(rgIdx[i], shape(i), "The index at " + i.ToString() + " must be <= the shape at " + i.ToString());
                    nOffset += rgIdx[i];
                }
            }

            return nOffset;
        }
893
        /// <summary>
        /// Copy a region of the data and/or diff from a source blob at given item offsets.
        /// </summary>
        /// <param name="src">Specifies the source blob.</param>
        /// <param name="nSrcOffset">Specifies the item offset within the source.</param>
        /// <param name="nDstOffset">Specifies the item offset within this blob.</param>
        /// <param name="nCount">Specifies the number of items to copy.</param>
        /// <param name="bCopyData">Specifies to copy the data values.</param>
        /// <param name="bCopyDiff">Specifies to copy the diff values.</param>
        public void CopyFrom(Blob<T> src, int nSrcOffset, int nDstOffset, int nCount, bool bCopyData, bool bCopyDiff)
        {
            m_log.CHECK_GE(count(), nDstOffset + nCount, "The data to be copied is larger that the destination blob.");
            m_log.CHECK_GE(src.count(), nSrcOffset + nCount, "The data to be copied is larger than the source blob.");

            if (bCopyData)
                m_cuda.copy(nCount, src.gpu_data, mutable_gpu_data, nSrcOffset, nDstOffset);

            if (bCopyDiff)
                m_cuda.copy(nCount, src.gpu_diff, mutable_gpu_diff, nSrcOffset, nDstOffset);
        }
914
        /// <summary>
        /// Copy the source blob's data (or diff) into this blob, optionally reshaping to
        /// match the source.
        /// </summary>
        /// <param name="src">Specifies the source blob.</param>
        /// <param name="bCopyDiff">Optionally, copy the diff instead of the data.</param>
        /// <param name="bReshape">Optionally, reshape this blob to match the source when the sizes differ (otherwise a mismatch fails).</param>
        /// <param name="hDstHostBuffer">Optionally, a host buffer handle passed through to SyncedMemory.Copy.</param>
        /// <param name="bIgnoreShape">Optionally, compare only the counts and ignore the shapes.</param>
        /// <returns>Returns the host buffer handle used by the copy, or 0 when both blobs already share the same GPU memory.</returns>
        public long CopyFrom(Blob<T> src, bool bCopyDiff = false, bool bReshape = false, long hDstHostBuffer = 0, bool bIgnoreShape = false)
        {
            // Ignore copy if the data points to the same handle.
            if (bCopyDiff)
            {
                if (src.gpu_diff == gpu_diff)
                    return 0;
            }
            else
            {
                if (src.gpu_data == gpu_data)
                    return 0;
            }

            // Size/shape mismatch: either reshape to match, or fail.
            if (src.count() != m_nCount || (!bIgnoreShape && !CompareShape(src.m_rgShape)))
            {
                if (bReshape)
                    ReshapeLike(src);
                else
                    m_log.FAIL("Trying to copy blobs of different sizes!");
            }

            if (bCopyDiff)
            {
                // A destination without diff memory is silently skipped.
                if (m_diff == null)
                    return hDstHostBuffer;

                return m_diff.Copy(src.diff, hDstHostBuffer);
            }
            else
            {
                if (m_data == null)
                    return hDstHostBuffer;

                return m_data.Copy(src.data, hDstHostBuffer);
            }
        }
965
        /// <summary>
        /// Copy all of the source values into this (equal or larger sized) blob, first
        /// filling the entire destination with a pad value so the tail items hold the pad.
        /// </summary>
        /// <param name="src">Specifies the source blob.</param>
        /// <param name="dfPad">Optionally, specifies the pad value (default = 0).</param>
        /// <param name="bCopyDiff">Optionally, copy the diff instead of the data.</param>
        public void CopyFromAndPad(Blob<T> src, double dfPad = 0, bool bCopyDiff = false)
        {
            // Same size - a plain copy suffices (no padding needed).
            if (count() == src.count())
            {
                CopyFrom(src, bCopyDiff);
                return;
            }

            if (count() < src.count())
                m_log.FAIL("The destination blob must be larger than the source blob.");

            // Fill the destination with the pad value, then overwrite the head items
            // with the source values.
            if (bCopyDiff)
            {
                SetDiff(dfPad);
                m_cuda.copy(src.count(), src.gpu_diff, mutable_gpu_diff);
            }
            else
            {
                SetData(dfPad);
                m_cuda.copy(src.count(), src.gpu_data, mutable_gpu_data);
            }
        }
995
1002 public void CopyFromAndTransposeHeightWidth(Blob<T> blobSrc, bool bCopyDiff = false, bool bUseCuda = true)
1003 {
1004 m_log.CHECK_EQ(blobSrc.num_axes, 4, "Currently, Blobs only support transposing 4 axis tensors.");
1005
1006 Reshape(blobSrc.num, blobSrc.channels, blobSrc.width, blobSrc.height);
1007
1008 SyncedMemory<T> dst = (bCopyDiff) ? m_diff : m_data;
1009 SyncedMemory<T> src = (bCopyDiff) ? blobSrc.m_diff : blobSrc.m_data;
1010
1011 int nN = num;
1012 int nC = channels;
1013 int nH = height;
1014 int nW = width;
1015
1016 if (bUseCuda)
1017 {
1018 m_cuda.transposeHW(nN, nC, nH, nW, src.gpu_data, dst.mutable_gpu_data);
1019 }
1020 else
1021 {
1022 T[] rgSrc = src.update_cpu_data();
1023 T[] rgDst = dst.mutable_cpu_data;
1024
1025 for (int n = 0; n < nN; n++)
1026 {
1027 for (int c = 0; c < nC; c++)
1028 {
1029 int nOffset = (n * nC * nH * nW) + (c * nH * nW);
1030
1031 for (int h = 0; h < nH; h++)
1032 {
1033 for (int w = 0; w < nW; w++)
1034 {
1035 int nSrcIdx = nOffset + (h * nW) + w;
1036 int nDstIdx = nOffset + (w + nH) + h;
1037 rgDst[nDstIdx] = rgSrc[nSrcIdx];
1038 }
1039 }
1040 }
1041 }
1042
1043 dst.mutable_cpu_data = rgDst;
1044 }
1045 }
1046
        /// <summary>
        /// Copy one channel's values from a source blob into a channel of this blob;
        /// both blobs must share the same num, height and width.
        /// </summary>
        /// <param name="blobSrc">Specifies the source blob.</param>
        /// <param name="nChannelFrom">Specifies the source channel index.</param>
        /// <param name="nChannelTo">Specifies the destination channel index.</param>
        /// <param name="bCopyDiff">Optionally, copy the diff instead of the data.</param>
        public void CopyFrom(Blob<T> blobSrc, int nChannelFrom, int nChannelTo, bool bCopyDiff = false)
        {
            m_log.CHECK_EQ(blobSrc.num, num, "The source and destination blobs must have the same num.");
            m_log.CHECK_EQ(blobSrc.height, height, "The source and destination blobs must have the same height.");
            m_log.CHECK_EQ(blobSrc.width, width, "The source and destination blobs must have the same width.");
            m_log.CHECK_LT(nChannelFrom, blobSrc.channels, "The channel form parameter is out of range!");
            m_log.CHECK_LT(nChannelTo, channels, "The channel to parameter is out of range!");

            SyncedMemory<T> dst = (bCopyDiff) ? m_diff : m_data;
            SyncedMemory<T> src = (bCopyDiff) ? blobSrc.m_diff : blobSrc.m_data;

            int nCsrc = blobSrc.channels;
            int nCdst = channels;
            int nDim = height * width;              // Items in one channel plane.
            int nSrcOffset = nChannelFrom * nDim;
            int nDstOffset = nChannelTo * nDim;
            int nSrcStep = (nCsrc * nDim);          // Stride to the same channel of the next item.
            int nDstStep = (nCdst * nDim);

            // Copy one channel plane per item.
            for (int n = 0; n < num; n++)
            {
                m_cuda.copy(nDim, src.gpu_data, dst.mutable_gpu_data, nSrcOffset, nDstOffset);
                nSrcOffset += nSrcStep;
                nDstOffset += nDstStep;
            }
        }
1080
        /// <summary>
        /// Compares the data (or diff) of this blob with another within a tolerance;
        /// see CompareEx for the details of each check.
        /// </summary>
        /// <returns>Returns true when the blobs match within the tolerance.</returns>
        public bool Compare(Blob<T> other, Blob<T> work, bool bDiff = false, double dfTol = 1e-8, bool bZeroCheck = true, bool bFullCompare = false, bool bDetectNans = true, bool bForceOtherData = false)
        {
            double dfMin;
            double dfMax;
            return CompareEx(other, work, out dfMin, out dfMax, bDiff, dfTol, bZeroCheck, bFullCompare, bDetectNans, bForceOtherData);
        }
1099
        /// <summary>
        /// Compares the data (or diff) of this blob with another, returning false when
        /// they differ by more than a tolerance, and also returning the min/max of the
        /// element-wise difference (this - other).
        /// </summary>
        /// <param name="other">Specifies the blob to compare against (must share the same Cuda kernel handle).</param>
        /// <param name="work">Specifies a work blob; it is reshaped to match this blob and its contents are overwritten.</param>
        /// <param name="dfMin">Returns the minimum of (this - other), or -1 when the counts differ.</param>
        /// <param name="dfMax">Returns the maximum of (this - other), or -1 when the counts differ.</param>
        /// <param name="bDiff">Optionally, compare the diff instead of the data.</param>
        /// <param name="dfTol">Optionally, specifies the tolerance (default = 1e-8).</param>
        /// <param name="bZeroCheck">Optionally, fail when exactly one side is all zero.</param>
        /// <param name="bFullCompare">Optionally, additionally compare every element on the CPU.</param>
        /// <param name="bDetectNans">Optionally, fail when either side has non-zero Item3/Item4 counts from CudaDnn.minmax (invalid-value detection).</param>
        /// <param name="bForceOtherData">Optionally, compare this blob's diff against the other blob's data.</param>
        /// <returns>Returns true when the blobs match within the tolerance.</returns>
        public bool CompareEx(Blob<T> other, Blob<T> work, out double dfMin, out double dfMax, bool bDiff = false, double dfTol = 1e-8, bool bZeroCheck = true, bool bFullCompare = false, bool bDetectNans = true, bool bForceOtherData = false)
        {
            dfMin = -1;
            dfMax = -1;

            // Blobs of different sizes never match; empty blobs always match.
            int nCount = count();
            if (nCount != other.count())
                return false;

            if (nCount == 0)
                return true;

            if (Cuda.KernelHandle != other.Cuda.KernelHandle)
                throw new Exception("The compare blob has a different Cuda Kernel Handles!");

            if (Cuda.KernelHandle != work.Cuda.KernelHandle)
                throw new Exception("The work blob has a different Cuda Kernel Handle!");

            work.ReshapeLike(this);

            long h1 = (bDiff) ? gpu_diff : gpu_data;
            long h2 = (bDiff && !bForceOtherData) ? other.gpu_diff : other.gpu_data;
            long lPos;

            // Element-wise difference, then its min/max against the tolerance.
            m_cuda.sub(nCount, h1, h2, work.mutable_gpu_data);
            dfMin = m_cuda.min(nCount, work.gpu_data, out lPos, 0, work.mutable_gpu_diff);
            dfMax = m_cuda.max(nCount, work.gpu_data, out lPos, 0, work.mutable_gpu_diff);

            if (Math.Abs(dfMin) > dfTol)
                return false;

            if (dfMax > dfTol)
                return false;

            // Invalid-value detection on both sides (minmax Item3/Item4 counts).
            if (bDetectNans)
            {
                Tuple<double, double, double, double> minmax1 = m_cuda.minmax(nCount, h1, work.gpu_data, work.gpu_diff, true);
                if (minmax1.Item3 > 0 || minmax1.Item4 > 0)
                    return false;

                Tuple<double, double, double, double> minmax2 = m_cuda.minmax(nCount, h2, work.gpu_data, work.gpu_diff, true);
                if (minmax2.Item3 > 0 || minmax2.Item4 > 0)
                    return false;
            }

            // Fail when exactly one side is entirely zero (the difference alone cannot
            // distinguish "both zero" from "mirror values cancelling").
            if (bZeroCheck)
            {
                double dfZero1 = m_cuda.asum_double(nCount, h1);
                double dfZero2 = m_cuda.asum_double(nCount, h2);

                if ((dfZero1 == 0 && dfZero2 != 0) || (dfZero1 != 0 && dfZero2 == 0))
                    return false;
            }

            // Optional exhaustive element-by-element check on the CPU.
            if (bFullCompare)
            {
                float[] rgf1 = Utility.ConvertVecF<T>((bDiff) ? mutable_cpu_diff : mutable_cpu_data);
                float[] rgf2 = Utility.ConvertVecF<T>((bDiff) ? other.mutable_cpu_diff : other.mutable_cpu_data);
                Dictionary<int, float> rgErr = new Dictionary<int, float>();

                for (int i = 0; i < rgf1.Length; i++)
                {
                    float f1 = rgf1[i];
                    float f2 = rgf2[i];
                    float fDiff = Math.Abs(f1 - f2);

                    if (fDiff > dfTol)
                        rgErr.Add(i, fDiff);
                }

                if (rgErr.Count > 0)
                    return false;
            }

            return true;
        }
1190
        /// <summary>
        /// Returns false when the data (or diff) contains invalid values as reported by
        /// CudaDnn.minmax with detection enabled (non-zero Item3/Item4 counts, e.g.
        /// NaN/inf -- see CudaDnn.minmax), otherwise true.
        /// </summary>
        /// <param name="work">Specifies a work blob; it is reshaped to match this blob and overwritten.</param>
        /// <param name="bDiff">Optionally, validate the diff instead of the data.</param>
        public bool ValidateData(Blob<T> work, bool bDiff = false)
        {
            int nCount = count();
            long h1 = (bDiff) ? gpu_diff : gpu_data;

            work.ReshapeLike(this);

            Tuple<double, double, double, double> minmax1 = m_cuda.minmax(nCount, h1, work.gpu_data, work.gpu_diff, true);
            if (minmax1.Item3 > 0 || minmax1.Item4 > 0)
                return false;

            return true;
        }
1210
1220 public bool Compare(CudaDnn<double> cuda, Blob<T> other, Blob<double> work, bool bDiff = false, double dfTol = 1e-8)
1221 {
1222 if (count() != other.count())
1223 return false;
1224
1225 work.Reshape(num, channels, height, width);
1228
1229 cuda.sub(count(), work.gpu_data, work.gpu_diff, work.mutable_gpu_data);
1230 double dfMin = work.min_data;
1231 if (Math.Abs(dfMin) > dfTol)
1232 return false;
1233
1234 double dfMax = work.max_data;
1235 if (dfMax > dfTol)
1236 return false;
1237
1238 return true;
1239 }
1240
1241#pragma warning disable 1591
1242
        /// <summary>
        /// Zeroes out all but the top 'nNumberToKeep' channels of each item, where
        /// channels are ranked by the sum of their values (largest sums kept).
        /// </summary>
        /// <param name="nNumberToKeep">Specifies how many channels to keep per item.</param>
        public void KeepBestResultsByChannel(int nNumberToKeep)
        {
            m_log.CHECK_EQ(num_axes, 4, "Currently KeepBestResutls only works on 4-axis blobs.");

            T[] rgData = mutable_cpu_data;
            int nN = num;
            int nC = channels;
            int nH = height;
            int nW = width;
            // Per item: the (channel, sum) pairs and a per-channel copy of the values.
            List<List<KeyValuePair<int, float>>> rgrgKeyValues = new List<List<KeyValuePair<int, float>>>();
            List<List<List<List<float>>>> rgrgrgrgData = new List<List<List<List<float>>>>();

            // Pass 1: accumulate each channel's sum and snapshot its values.
            for (int n = 0; n < nN; n++)
            {
                List<KeyValuePair<int, float>> rgKeyValues = new List<KeyValuePair<int, float>>();
                List<List<List<float>>> rgrgrgData = new List<List<List<float>>>();

                for (int c = 0; c < nC; c++)
                {
                    float fSum = 0;
                    List<List<float>> rgrgData = new List<List<float>>();

                    for (int h = 0; h < nH; h++)
                    {
                        List<float> rgVal = new List<float>();

                        for (int w = 0; w < nW; w++)
                        {
                            int nIdx = (n * nC * nH * nW) + (c * nH * nW) + (h * nW) + w;
                            float fVal = (float)Convert.ChangeType(rgData[nIdx], typeof(float));
                            rgVal.Add(fVal);
                            fSum += fVal;
                        }

                        rgrgData.Add(rgVal);
                    }

                    rgKeyValues.Add(new KeyValuePair<int, float>(c, fSum));
                    rgrgrgData.Add(rgrgData);
                }

                // Sort channels by descending sum (see sort()).
                rgKeyValues.Sort(new Comparison<KeyValuePair<int, float>>(sort));

                rgrgKeyValues.Add(rgKeyValues);
                rgrgrgrgData.Add(rgrgrgData);
            }

            // Pass 2: clear everything, then restore only the kept channels.
            SetData(0);
            rgData = mutable_cpu_data;

            for (int n = 0; n < nN; n++)
            {
                List<KeyValuePair<int, float>> rgKeyValues = rgrgKeyValues[n];
                List<List<List<float>>> rgrgrgData = rgrgrgrgData[n];
                List<int> rgIdx = new List<int>();

                for (int i = 0; i < nNumberToKeep && i < rgKeyValues.Count; i++)
                {
                    rgIdx.Add(rgKeyValues[i].Key);
                }

                foreach (int c in rgIdx)
                {
                    // rgrgrgData was filled in channel order, so index directly by channel.
                    List<List<float>> rgrgData = rgrgrgData[c];

                    for (int h = 0; h < nH; h++)
                    {
                        List<float> rgVal = rgrgData[h];

                        for (int w = 0; w < nW; w++)
                        {
                            int nIdx = (n * nC * nH * nW) + (c * nH * nW) + (h * nW) + w;
                            rgData[nIdx] = (T)Convert.ChangeType(rgVal[w], typeof(T));
                        }
                    }
                }
            }

            mutable_cpu_data = rgData;
        }
1323
        /// <summary>
        /// Zeroes out all but the top 'nNumberToKeep' individual values of each item,
        /// ranked by value (largest kept).
        /// </summary>
        /// <param name="nNumberToKeep">Specifies how many values to keep per item.</param>
        public void KeepBestResultsByWeight(int nNumberToKeep)
        {
            m_log.CHECK_EQ(num_axes, 4, "Currently KeepBestResutls only works on 4-axis blobs.");

            T[] rgData = mutable_cpu_data;
            int nN = num;
            int nC = channels;
            int nH = height;
            int nW = width;
            // Per item: all (flat index, value) pairs sorted by descending value.
            List<List<KeyValuePair<int, float>>> rgrgKeyValues = new List<List<KeyValuePair<int, float>>>();

            // Pass 1: collect every value of each item with its flat index.
            for (int n = 0; n < nN; n++)
            {
                List<KeyValuePair<int, float>> rgKeyValues = new List<KeyValuePair<int, float>>();

                for (int c = 0; c < nC; c++)
                {
                    for (int h = 0; h < nH; h++)
                    {
                        for (int w = 0; w < nW; w++)
                        {
                            int nIdx = (n * nC * nH * nW) + (c * nH * nW) + (h * nW) + w;
                            rgKeyValues.Add(new KeyValuePair<int, float>(nIdx, (float)Convert.ChangeType(rgData[nIdx], typeof(float))));
                        }
                    }
                }

                // Sort by descending value (see sort()).
                rgKeyValues.Sort(new Comparison<KeyValuePair<int, float>>(sort));
                rgrgKeyValues.Add(rgKeyValues);
            }

            // Pass 2: clear everything, then restore only the kept values.
            SetData(0);
            rgData = mutable_cpu_data;

            for (int n = 0; n < nN; n++)
            {
                List<KeyValuePair<int, float>> rgKeyValues = rgrgKeyValues[n];

                for (int i = 0; i < nNumberToKeep && i < rgKeyValues.Count; i++)
                {
                    KeyValuePair<int, float> kv = rgKeyValues[i];
                    rgData[kv.Key] = (T)Convert.ChangeType(kv.Value, typeof(T));
                }
            }

            mutable_cpu_data = rgData;
        }
1371
1372#pragma warning restore 1591
1373
1374
1375 private int sort(KeyValuePair<int, float> a, KeyValuePair<int, float> b)
1376 {
1377 if (a.Value < b.Value)
1378 return 1;
1379
1380 if (a.Value > b.Value)
1381 return -1;
1382
1383 return 0;
1384 }
1385
        /// <summary>
        /// Returns the data value at (n, c, h, w).
        /// </summary>
        public T data_at(int n, int c, int h, int w)
        {
            return m_data.GetAt(offset(n, c, h, w));
        }

        /// <summary>
        /// Returns the diff value at (n, c, h, w).
        /// </summary>
        public T diff_at(int n, int c, int h, int w)
        {
            return m_diff.GetAt(offset(n, c, h, w));
        }

        /// <summary>
        /// Returns the data value at a multi-axis index.
        /// </summary>
        public T data_at(List<int> rgIdx)
        {
            return m_data.GetAt(offset(rgIdx));
        }

        /// <summary>
        /// Returns the diff value at a multi-axis index.
        /// </summary>
        public T diff_at(List<int> rgIdx)
        {
            return m_diff.GetAt(offset(rgIdx));
        }
1431
1436 {
1437 get { return m_data; }
1438 }
1439
1444 {
1445 get { return m_diff; }
1446 }
1447
        /// <summary>
        /// Returns the CPU-side copy of the data held by the SyncedMemory (call
        /// update_cpu_data to refresh it first).
        /// </summary>
        public T[] cpu_data
        {
            get { return m_data.cpu_data; }
        }
1455
1461 {
1462 get { return m_data.mutable_cpu_data; }
1463 set { m_data.mutable_cpu_data = value; }
1464 }
1465
        /// <summary>
        /// Updates and returns the CPU copy of the data via SyncedMemory.update_cpu_data,
        /// using the current item count.
        /// </summary>
        public T[] update_cpu_data()
        {
            return m_data.update_cpu_data(m_nCount);
        }

        /// <summary>
        /// Returns the GPU handle of the data memory.
        /// </summary>
        public long gpu_data
        {
            get { return m_data.gpu_data; }
        }
1482
1487 {
1488 get { return m_data.mutable_gpu_data; }
1489// set { m_data.mutable_gpu_data = value; }
1490 }
1491
        /// <summary>
        /// Returns the CPU-side copy of the diff held by the SyncedMemory, or null when
        /// the blob has no diff.
        /// </summary>
        public T[] cpu_diff
        {
            get
            {
                if (m_diff == null)
                    return null;

                return m_diff.cpu_data;
            }
        }
1505
1511 {
1512 get
1513 {
1514 if (m_diff == null)
1515 return null;
1516
1517 return m_diff.mutable_cpu_data;
1518 }
1519 set
1520 {
1521 m_diff.mutable_cpu_data = value;
1522 }
1523 }
1524
        /// <summary>
        /// Updates and returns the CPU copy of the diff via SyncedMemory.update_cpu_data,
        /// or null when the blob has no diff.
        /// </summary>
        public T[] update_cpu_diff()
        {
            if (m_diff == null)
                return null;

            return m_diff.update_cpu_data(m_nCount);
        }

        /// <summary>
        /// Returns the GPU handle of the diff memory, or 0 when the blob has no diff.
        /// </summary>
        public long gpu_diff
        {
            get
            {
                if (m_diff == null)
                    return 0;

                return m_diff.gpu_data;
            }
        }
1550
1555 {
1556 get { return m_diff.mutable_gpu_data; }
1557// set { m_diff.mutable_gpu_data = value; }
1558 }
1559
        /// <summary>
        /// Returns the GPU handle of the shape memory.
        /// </summary>
        public long gpu_shape
        {
            get { return m_shape.gpu_data; }
        }

        /// <summary>
        /// Apply the accumulated diff to the data: data = data + (-1) * diff.  A no-op
        /// when the blob has no diff or learning is frozen.
        /// </summary>
        public void Update()
        {
            if (!m_bIncludeDiff || m_bFreezeLearning)
                return;

            // The GPU is assumed to be the owner of the data.
            m_cuda.axpy(m_nCount, m_tMinusOne, m_diff.gpu_data, m_data.mutable_gpu_data);
        }
1583
1589 public void FromProto(BlobProto bp, bool bReshape = true)
1590 {
1591 if (bReshape)
1592 {
1593 List<int> rgShape = new List<int>();
1594
1595 if (bp.num.HasValue || bp.channels.HasValue || bp.height.HasValue || bp.width.HasValue)
1596 {
1597 // Using depreciated 4D Blob dimensions --
1598 // shape is (num, channels, height, width).
1599 if (bp.num.HasValue)
1600 rgShape.Add(bp.num.Value);
1601
1602 if (bp.channels.HasValue)
1603 rgShape.Add(bp.channels.Value);
1604
1605 if (bp.height.HasValue)
1606 rgShape.Add(bp.height.Value);
1607
1608 if (bp.width.HasValue)
1609 rgShape.Add(bp.width.Value);
1610 }
1611 else
1612 {
1613 rgShape = Utility.Clone<int>(bp.shape.dim);
1614 }
1615
1616 Reshape(rgShape);
1617 }
1618 else
1619 {
1620 m_log.CHECK(ShapeEquals(bp), "Shape mismatch (reshape not set)!");
1621 }
1622
1623 // Copy the data.
1624 T[] rgData = null;
1625
1626 if (bp.double_data.Count > 0)
1627 {
1628 m_log.CHECK_EQ(m_nCount, bp.double_data.Count, "The double data count is not the same as the blob data count!");
1629 rgData = Utility.ConvertVec<T>(bp.double_data.ToArray());
1630 }
1631 else if (bp.data.Count > 0)
1632 {
1633 m_log.CHECK_EQ(m_nCount, bp.data.Count, "The double data count is not the same as the blob data count!");
1634 rgData = Utility.ConvertVec<T>(bp.data.ToArray());
1635 }
1636
1637 if (rgData != null)
1638 mutable_cpu_data = rgData;
1639
1640 // Copy the diff.
1641 T[] rgDiff = null;
1642
1643 if (bp.double_diff.Count > 0)
1644 {
1645 m_log.CHECK_EQ(m_nCount, bp.double_diff.Count, "The double diff count is not the same as the blob data count!");
1646 rgDiff = Utility.ConvertVec<T>(bp.double_diff.ToArray());
1647 }
1648 else if (bp.diff.Count > 0)
1649 {
1650 m_log.CHECK_EQ(m_nCount, bp.diff.Count, "The double data count is not the same as the blob data count!");
1651 rgDiff = Utility.ConvertVec<T>(bp.diff.ToArray());
1652 }
1653
1654 if (rgDiff != null)
1655 mutable_cpu_diff = rgDiff;
1656 }
1657
1663 public BlobProto ToProto(bool bWriteDiff = false)
1664 {
1665 BlobProto bp = new BlobProto(m_rgShape);
1666
1667 T[] rgData = (bWriteDiff) ? null : update_cpu_data();
1668 T[] rgDiff = (bWriteDiff) ? update_cpu_diff() : null;
1669
1670 if (typeof(T) == typeof(double))
1671 {
1672 if (rgData != null)
1673 {
1674 double[] rgDataD = Utility.ConvertVec<T>(rgData);
1675 bp.double_data = new List<double>(rgDataD);
1676 }
1677
1678 if (rgDiff != null)
1679 {
1680 double[] rgDiffD = Utility.ConvertVec<T>(rgData);
1681 bp.double_diff = new List<double>(rgDiffD);
1682 }
1683 }
1684 else
1685 {
1686 if (rgData != null)
1687 {
1688 float[] rgDataF = Utility.ConvertVecF<T>(rgData);
1689 bp.data = new List<float>(rgDataF);
1690 }
1691
1692 if (rgDiff != null)
1693 {
1694 float[] rgDiffF = Utility.ConvertVecF<T>(rgDiff);
1695 bp.diff = new List<float>(rgDiffF);
1696 }
1697 }
1698
1699 return bp;
1700 }
1701
1706 public T asum_data()
1707 {
1708 if (m_nCount == 0 || gpu_data == 0)
1709 return m_tZero;
1710
1711 return m_cuda.asum(m_nCount, gpu_data);
1712 }
1713
1718 public T asum_diff()
1719 {
1720 if (m_nCount == 0 || gpu_diff == 0)
1721 return m_tZero;
1722
1723 return m_cuda.asum(m_nCount, gpu_diff);
1724 }
1725
1730 public T sumsq_data()
1731 {
1732 if (m_nCount == 0 || gpu_data == 0)
1733 return m_tZero;
1734
1735 return m_cuda.dot(m_nCount, gpu_data, gpu_data);
1736 }
1737
1742 public T sumsq_diff()
1743 {
1744 if (m_nCount == 0 || gpu_diff == 0)
1745 return m_tZero;
1746
1747 return m_cuda.dot(m_nCount, gpu_diff, gpu_diff);
1748 }
1749
1754 public void scale_data(double df)
1755 {
1756 scale_data((T)Convert.ChangeType(df, typeof(T)));
1757 }
1758
1763 public void scale_diff(double df)
1764 {
1765 scale_diff((T)Convert.ChangeType(df, typeof(T)));
1766 }
1767
        /// <summary>
        /// Rescale the blob data values linearly into the range [dfMin, dfMax] (in place on the GPU).
        /// </summary>
        /// <param name="dfMin">Specifies the minimum of the target range.</param>
        /// <param name="dfMax">Specifies the maximum of the target range.</param>
        public void scale_to_range(double dfMin, double dfMax)
        {
            m_cuda.scale_to_range(m_nCount, gpu_data, mutable_gpu_data, dfMin, dfMax);
        }
1777
        /// <summary>
        /// Scale the data in the blob by the scaling factor (in place on the GPU).
        /// </summary>
        /// <param name="fScaleFactor">Specifies the scaling factor.</param>
        public void scale_data(T fScaleFactor)
        {
            m_cuda.scal(m_nCount, fScaleFactor, mutable_gpu_data);
        }
1786
        /// <summary>
        /// Scale the diff in the blob by the scaling factor (in place on the GPU).
        /// </summary>
        /// <param name="fScaleFactor">Specifies the scaling factor.</param>
        public void scale_diff(T fScaleFactor)
        {
            m_cuda.scal(m_nCount, fScaleFactor, mutable_gpu_diff);
        }
1795
1803 {
1804 get { return m_bReshapeWhenSharing; }
1805 set { m_bReshapeWhenSharing = value; }
1806 }
1807
        /// <summary>
        /// Share the data of another Blob - this blob's data memory is released (when owned)
        /// and replaced by a reference to <i>b</i>'s data, which this blob will not own.
        /// </summary>
        /// <param name="b">Specifies the Blob whose data is to be shared.</param>
        public void ShareData(Blob<T> b)
        {
            // Either the counts must match, or reshape_when_sharing allows this blob
            // to take on the shape of the source blob.
            if (!m_bReshapeWhenSharing)
                m_log.CHECK_EQ(m_nCount, b.count(), "The blob counts are not the same!");
            else
                reshapeShape(b.shape());

            // Release our own data before aliasing b's, to avoid leaking GPU memory.
            if (m_bOwnData && m_data != null)
                m_data.Dispose();

            m_data = b.m_data;
            m_bOwnData = false;
        }
1826
        /// <summary>
        /// Share the diff of another Blob - this blob's diff memory is released (when owned)
        /// and replaced by a reference to <i>b</i>'s diff, which this blob will not own.
        /// </summary>
        /// <param name="b">Specifies the Blob whose diff is to be shared.</param>
        public void ShareDiff(Blob<T> b)
        {
            // Either the counts must match, or reshape_when_sharing allows this blob
            // to take on the shape of the source blob.
            if (!m_bReshapeWhenSharing)
                m_log.CHECK_EQ(m_nCount, b.count(), "The blob counts are not the same!");
            else
                reshapeShape(b.shape());

            // Release our own diff before aliasing b's, to avoid leaking GPU memory.
            if (m_bOwnDiff && m_diff != null)
                m_diff.Dispose();

            m_diff = b.m_diff;
            m_bOwnDiff = false;
        }
1845
        /// <summary>
        /// Share the data, diff and shape of another Blob. All previously owned memory is
        /// released, and this blob becomes a non-owning alias of <i>b</i>'s memory, also
        /// copying b's count, capacity, shape list and index.
        /// </summary>
        /// <param name="b">Specifies the Blob to share.</param>
        public void Share(Blob<T> b)
        {
            // Dispose each owned resource before aliasing to avoid GPU memory leaks.
            if (m_bOwnData && m_data != null)
                m_data.Dispose();

            m_data = b.m_data;
            m_bOwnData = false;

            if (m_bOwnDiff && m_diff != null)
                m_diff.Dispose();

            m_diff = b.m_diff;
            m_bOwnDiff = false;

            if (m_bOwnShape && m_shape != null)
                m_shape.Dispose();

            m_shape = b.m_shape;
            m_bOwnShape = false;

            m_nCount = b.m_nCount;
            m_nCapacity = b.m_nCapacity;
            // NOTE(review): m_rgShape is aliased (not copied) - a later reshape of b
            // mutates this blob's shape list as well; confirm this is intended.
            m_rgShape = b.m_rgShape;
            m_nIdx = b.m_nIdx;
        }
1875
1883 {
1884 get { return m_bSnapshotRequested; }
1885 set { m_bSnapshotRequested = value; }
1886 }
1887
1893 public T GetData(int nIdx)
1894 {
1895 T[] rg = m_cuda.get(count(), gpu_data, nIdx);
1896 if (rg.Length == 0)
1897 throw new Exception("No data at index = " + nIdx.ToString());
1898
1899 return rg[0];
1900 }
1901
1907 public T GetDiff(int nIdx)
1908 {
1909 T[] rg = m_cuda.get(count(), gpu_diff, nIdx);
1910 if (rg.Length == 0)
1911 throw new Exception("No data at index = " + nIdx.ToString());
1912
1913 return rg[0];
1914 }
1915
        /// <summary>
        /// Sets the blob data from an array of values (delegates to the underlying SyncedMemory).
        /// </summary>
        /// <param name="rgData">Specifies the data values to set.</param>
        /// <param name="nCount">Optionally, specifies the number of items to copy (-1 = all).</param>
        /// <param name="bSetCount">Optionally, specifies whether to update the memory's count.</param>
        public void SetData(T[] rgData, int nCount = -1, bool bSetCount = true)
        {
            m_data.SetData(rgData, nCount, bSetCount);
        }
1926
1933 public void SetData(T fVal, int nIdx = -1)
1934 {
1935 if (mutable_gpu_data == 0)
1936 return;
1937
1938 m_cuda.set(count(), mutable_gpu_data, fVal, nIdx);
1939 }
1940
1947 public void SetData(double dfVal, int nIdx = -1)
1948 {
1949 if (mutable_gpu_data == 0)
1950 return;
1951
1952 m_cuda.set(count(), mutable_gpu_data, dfVal, nIdx);
1953 }
1954
1961 public void SetData(double dfVal, int nStartIdx, int nCount)
1962 {
1963 T tVal = (T)Convert.ChangeType(dfVal, typeof(T));
1964 T[] rg = mutable_cpu_data;
1965
1966 for (int i = 0; i < nCount; i++)
1967 {
1968 if (nStartIdx + i < rg.Length)
1969 rg[nStartIdx + i] = tVal;
1970 }
1971
1972 mutable_cpu_data = rg;
1973 }
1974
1981 public void SetDiff(double dfVal, int nIdx = -1)
1982 {
1983 if (m_bIncludeDiff)
1984 {
1985 if (mutable_gpu_diff == 0)
1986 return;
1987
1988 m_cuda.set(count(), mutable_gpu_diff, dfVal, nIdx);
1989 }
1990 }
1991
1998 public void SetDiff(double dfVal, int nStartIdx, int nCount)
1999 {
2000 T tVal = (T)Convert.ChangeType(dfVal, typeof(T));
2001 T[] rg = mutable_cpu_diff;
2002
2003 for (int i = 0; i < nCount; i++)
2004 {
2005 if (nStartIdx + i < rg.Length)
2006 rg[nStartIdx + i] = tVal;
2007 }
2008
2009 mutable_cpu_diff = rg;
2010 }
2011
        /// <summary>
        /// Sets the blob diff from an array of values (delegates to the underlying SyncedMemory).
        /// </summary>
        /// <param name="rgDiff">Specifies the diff values to set.</param>
        /// <param name="nCount">Optionally, specifies the number of items to copy (-1 = all).</param>
        /// <param name="bSetCount">Optionally, specifies whether to update the memory's count.</param>
        public void SetDiff(T[] rgDiff, int nCount = -1, bool bSetCount = true)
        {
            m_diff.SetData(rgDiff, nCount, bSetCount);
        }
2022
        /// <summary>
        /// Sets the blob data from a SimpleDatum, optionally reshaping to (1, channels, height, width) first.
        /// </summary>
        /// <param name="d">Specifies the SimpleDatum supplying the data.</param>
        /// <param name="bReshape">When <i>true</i>, the blob is reshaped to the datum's dimensions with num = 1.</param>
        /// <param name="bCopyData">Optionally, specifies whether the data values (and index) are actually copied.</param>
        public void SetData(SimpleDatum d, bool bReshape, bool bCopyData = true)
        {
            if (bReshape)
            {
                // Reset the capacity so the Reshape below reallocates rather than reuses.
                m_nCapacity = 0;
                Reshape(1, d.Channels, d.Height, d.Width);
            }

            T[] rgData = d.GetData<T>();

            m_log.CHECK_EQ(rgData.Length, count(), "The datum data length of " + rgData.Length.ToString() + " should be equal to the Blob count() of " + count().ToString());

            if (bCopyData)
            {
                mutable_cpu_data = rgData;
                m_nIdx = d.Index;
            }
        }
2047
        /// <summary>
        /// Sets just the CPU-side data (no GPU transfer) and marks the blob as ready for a
        /// later AsyncGpuPush.
        /// </summary>
        /// <param name="rg">Specifies the CPU data values to set.</param>
        public void SetCPUData(T[] rg)
        {
            m_bCpuDataReadyForPush = true;
            m_data.set_cpu_data_locally(rg);
        }
2057
        /// <summary>
        /// Asynchronously pushes the CPU data (previously set with SetCPUData) to the GPU on the
        /// given stream. Does nothing unless SetCPUData was called since the last push.
        /// </summary>
        /// <param name="hStream">Specifies the CUDA stream handle to use for the transfer.</param>
        public void AsyncGpuPush(long hStream)
        {
            if (!m_bCpuDataReadyForPush)
                return;

            if (m_data.cpu_data == null)
                throw new Exception("There is no CPU data to push to the GPU!");

            m_data.async_gpu_push(hStream, m_data.cpu_data);
            // Clear the flag so repeated calls do not re-push the same data.
            m_bCpuDataReadyForPush = false;
        }
2073
        /// <summary>
        /// Compares the shape of this blob to the shape within a BlobProto, supporting both
        /// the new dim-list form and the legacy 4D (num, channels, height, width) form.
        /// </summary>
        /// <param name="bp">Specifies the BlobProto to compare against.</param>
        /// <returns>Returns <i>true</i> when the shapes are the same, <i>false</i> otherwise.</returns>
        public bool ShapeEquals(BlobProto bp)
        {
            if (bp.num.HasValue || bp.channels.HasValue || bp.height.HasValue || bp.width.HasValue)
            {
                // Using deprecated 4D blob dimensions --
                // shape is (num, channels, height, width).
                // Note: we do not use the normal Blob::num, Blob::channels() etc.
                // methods as these index from the beginning of the blob shape, where legacy
                // parameter blobs were indexed from the end of the blob shape (e.g., bias
                // Blob shape (1 x 1 x 1 x N), IP layer weight Blob shape (1 x 1 x M x N).
                if (m_rgShape.Count <= 4 &&
                    LegacyShape(-4) == bp.num.GetValueOrDefault(1) &&
                    LegacyShape(-3) == bp.channels.GetValueOrDefault(1) &&
                    LegacyShape(-2) == bp.height.GetValueOrDefault(1) &&
                    LegacyShape(-1) == bp.width.GetValueOrDefault(1))
                    return true;
                else
                    return false;
            }

            return Utility.Compare<int>(m_rgShape, bp.shape.dim);
        }
2101
2108 public bool CompareShape(List<int> rgShape, bool bCompareCpuDataLen = false)
2109 {
2110 while (rgShape.Count < num_axes)
2111 {
2112 rgShape.Add(1);
2113 }
2114
2115 if (shape().Count == 0 && rgShape.Count == 0)
2116 return true;
2117
2118 if (shape().Count == 0 && rgShape.Count == 1 && rgShape[0] == 0)
2119 return true;
2120
2121 List<int> rgShape1 = new List<int>(shape());
2122 while (rgShape1.Count < rgShape.Count)
2123 {
2124 rgShape1.Add(1);
2125 }
2126
2127 if (bCompareCpuDataLen)
2128 {
2129 int nCount = 1;
2130 for (int i = 0; i < rgShape.Count; i++)
2131 {
2132 nCount *= rgShape[i];
2133 }
2134
2135 if (cpu_data == null || cpu_data.Length != nCount)
2136 return false;
2137 }
2138
2139 return Utility.Compare<int>(rgShape1, rgShape);
2140 }
2141
        /// <summary>
        /// Compares the given shape (as an array) to this blob's shape.
        /// </summary>
        /// <param name="rgShape">Specifies the shape to compare.</param>
        /// <param name="bCompareCpuDataLen">Optionally, also require cpu_data to exist with a length equal to the shape's element count.</param>
        /// <returns>Returns <i>true</i> when the shapes match, <i>false</i> otherwise.</returns>
        public bool CompareShape(int[] rgShape, bool bCompareCpuDataLen = false)
        {
            return CompareShape(new List<int>(rgShape), bCompareCpuDataLen);
        }
2152
2157 public string ToSizeString()
2158 {
2159 return num.ToString() + "," + channels.ToString() + "," + height.ToString() + "," + width.ToString();
2160 }
2161
2167 {
2168 if (typeof(T) == typeof(double))
2169 {
2170 double[] rgData = m_cuda.GetMemoryDouble(gpu_data, count());
2171 return new Datum(true, channels, width, height, -1, DateTime.MinValue, new List<double>(rgData), 0, false, -1);
2172 }
2173 else
2174 {
2175 float[] rgData = m_cuda.GetMemoryFloat(gpu_data, count());
2176 return new Datum(true, channels, width, height, -1, DateTime.MinValue, new List<float>(rgData), 0, false, -1);
2177 }
2178 }
2179
        /// <summary>
        /// Get/set the name of the Blob. Setting the name also tags the underlying data and
        /// diff memory (useful when tracing memory usage).
        /// </summary>
        public string Name
        {
            get { return m_strName; }
            set
            {
                m_strName = value;

                if (m_data != null)
                    m_data.Tag = m_strName + " data";

                if (m_diff != null)
                    m_diff.Tag = m_strName + " diff";
            }
        }
2197
2203 {
2204 Blob<T> b = new Blob<T>(m_cuda, m_log);
2205
2206 b.ReshapeLike(this, HalfSize);
2207
2208 if (m_diff != null)
2209 b.m_diff.Copy(m_diff);
2210
2211 b.m_data.Copy(m_data);
2212 b.Name = Name;
2213 b.m_bReshapeWhenSharing = reshape_when_sharing;
2214
2215 return b;
2216 }
2217
        /// <summary>
        /// Computes a new blob = (blobA * fScale) + this blob's data. Neither input blob is modified.
        /// </summary>
        /// <param name="blobA">Specifies the other operand; it is cloned before scaling.</param>
        /// <param name="fScale">Specifies the scale applied to blobA's data before the add.</param>
        /// <returns>A new Blob containing the result (caller owns and must dispose it).</returns>
        public Blob<T> MathAdd(Blob<T> blobA, T fScale)
        {
            Blob<T> bOut = blobA.Clone();

            // Skip the scaling kernel when the factor is exactly 1.
            if ((double)Convert.ChangeType(fScale, typeof(double)) != 1.0)
                bOut.scale_data(fScale);

            m_cuda.add(bOut.count(), bOut.gpu_data, gpu_data, bOut.mutable_gpu_data);

            return bOut;
        }
2238
2248 {
2249 Blob<T> bOut = blobA.Clone();
2250
2251 m_cuda.sub(bOut.count(), bOut.gpu_data, gpu_data, bOut.mutable_gpu_data);
2252
2253 return bOut;
2254 }
2255
        /// <summary>
        /// Computes a new blob = this blob's data / fScale (implemented as a multiply by the
        /// reciprocal). This blob is not modified.
        /// </summary>
        /// <param name="fScale">Specifies the divisor. NOTE(review): a zero divisor yields an infinite reciprocal - no guard here; confirm callers never pass 0.</param>
        /// <returns>A new Blob containing the result (caller owns and must dispose it).</returns>
        public Blob<T> MathDiv(T fScale)
        {
            Blob<T> bOut = Clone();

            double dfVal = 1.0/(double)Convert.ChangeType(fScale, typeof(double));

            m_cuda.mul_scalar(bOut.count(), (T)Convert.ChangeType(dfVal, typeof(T)), bOut.mutable_gpu_data);

            return bOut;
        }
2274
2282 public void SaveBinary(string strFile, bool bData, bool bDiff, bool bIncludeName = true)
2283 {
2284 using (FileStream fs = File.OpenWrite(strFile))
2285 using (BinaryWriter bw = new BinaryWriter(fs))
2286 {
2287 Save(bw, bData, bDiff, bIncludeName);
2288 }
2289 }
2290
        /// <summary>
        /// Saves this Blob to a BinaryWriter using the format (read back by Load):
        /// [nameLen][name?][shapeCount][dim...][count][dataCount][data as double...][diffCount][diff as double...]
        /// where dataCount/diffCount are 0 when the corresponding section is omitted.
        /// </summary>
        /// <param name="bw">Specifies the BinaryWriter to write to.</param>
        /// <param name="bData">Specifies whether to save the data.</param>
        /// <param name="bDiff">Specifies whether to save the diff.</param>
        /// <param name="bIncludeName">Optionally, specifies whether to save the blob name.</param>
        public void Save(BinaryWriter bw, bool bData, bool bDiff, bool bIncludeName = true)
        {
            // A zero name length tells Load to skip reading the name string.
            if (!bIncludeName)
            {
                bw.Write(0);
            }
            else
            {
                bw.Write(m_strName.Length);
                bw.Write(m_strName);
            }

            bw.Write(m_rgShape.Count);
            for (int i = 0; i < m_rgShape.Count; i++)
            {
                bw.Write(m_rgShape[i]);
            }

            // Total item count, used by Load to sanity-check the section counts below.
            bw.Write(m_nCount);

            if (bData)
            {
                bw.Write(m_nCount);

                // Values are always persisted as doubles regardless of T.
                double[] rgdfData = Utility.ConvertVec<T>(update_cpu_data());

                foreach (double dfVal in rgdfData)
                {
                    bw.Write(dfVal);
                }
            }
            else
            {
                bw.Write((int)0);
            }

            if (bDiff)
            {
                bw.Write(m_nCount);

                double[] rgdfDiff = Utility.ConvertVec<T>(update_cpu_diff());

                foreach (double dfVal in rgdfDiff)
                {
                    bw.Write(dfVal);
                }
            }
            else
            {
                bw.Write((int)0);
            }
        }
2350
        /// <summary>
        /// Loads a new Blob from a binary file previously written with SaveBinary.
        /// </summary>
        /// <param name="cuda">Specifies the CudaDnn instance used by the new blob.</param>
        /// <param name="log">Specifies the output Log.</param>
        /// <param name="strFile">Specifies the file path to read.</param>
        /// <param name="bData">Specifies whether to read the data into the blob.</param>
        /// <param name="bDiff">Specifies whether to read the diff into the blob.</param>
        /// <returns>The newly loaded Blob (caller owns and must dispose it).</returns>
        public static Blob<T> LoadBinary(CudaDnn<T> cuda, Log log, string strFile, bool bData, bool bDiff)
        {
            using (FileStream fs = File.OpenRead(strFile))
            using (BinaryReader br = new BinaryReader(fs))
            {
                return Load(cuda, log, br, bData, bDiff);
            }
        }
2367
        /// <summary>
        /// Loads a new Blob from a BinaryReader using the format written by Save. The data and
        /// diff sections are always consumed from the stream; bData/bDiff only control whether
        /// they are copied into the blob.
        /// </summary>
        /// <param name="cuda">Specifies the CudaDnn instance used by the new blob.</param>
        /// <param name="log">Specifies the output Log.</param>
        /// <param name="br">Specifies the BinaryReader to read from.</param>
        /// <param name="bData">Specifies whether to load the data into the blob.</param>
        /// <param name="bDiff">Specifies whether to load the diff into the blob.</param>
        /// <returns>The newly loaded Blob (caller owns and must dispose it).</returns>
        public static Blob<T> Load(CudaDnn<T> cuda, Log log, BinaryReader br, bool bData, bool bDiff)
        {
            Blob<T> b = new Blob<T>(cuda, log);

            // Name is only present when a non-zero length was written.
            int nNameLen = br.ReadInt32();
            if (nNameLen > 0)
                b.Name = br.ReadString();

            List<int> rgShape = new List<int>();
            int nCount = br.ReadInt32();

            for (int i = 0; i < nCount; i++)
            {
                rgShape.Add(br.ReadInt32());
            }

            b.Reshape(rgShape);

            // nItemCount is the blob's total count; the per-section counts must not exceed it.
            int nItemCount = br.ReadInt32();
            int nDataCount = br.ReadInt32();

            if (nDataCount > nItemCount)
                throw new Exception("Invalid data count read!");

            List<double> rgData = new List<double>();

            for (int i = 0; i < nDataCount; i++)
            {
                rgData.Add(br.ReadDouble());
            }

            int nDiffCount = br.ReadInt32();

            if (nDiffCount > nItemCount)
                throw new Exception("Invalid diff count read!");

            List<double> rgDiff = new List<double>();

            for (int i = 0; i < nDiffCount; i++)
            {
                rgDiff.Add(br.ReadDouble());
            }

            // When both sections are present they must describe the same number of items.
            if (nDataCount > 0 && nDiffCount > 0 && nDataCount != nDiffCount)
                throw new Exception("Invalid diff and data counts read - they should be equal!");

            if (bData && rgData.Count > 0)
                b.mutable_cpu_data = Utility.ConvertVec<T>(rgData.ToArray());

            if (bDiff && rgDiff.Count > 0)
                b.mutable_cpu_diff = Utility.ConvertVec<T>(rgDiff.ToArray());

            return b;
        }
2431
        /// <summary>
        /// Serializes the blob (name, shape and data - not the diff) to a byte array using Save.
        /// </summary>
        /// <returns>The byte array containing the serialized blob.</returns>
        public byte[] ToByteArray()
        {
            using (MemoryStream ms = new MemoryStream())
            using (BinaryWriter bw = new BinaryWriter(ms))
            {
                Save(bw, true, false, true);
                // BinaryWriter writes through to the MemoryStream, so ToArray here sees all bytes.
                return ms.ToArray();
            }
        }
2445
        /// <summary>
        /// Deserializes a new Blob from a byte array previously produced by ToByteArray.
        /// </summary>
        /// <param name="cuda">Specifies the CudaDnn instance used by the new blob.</param>
        /// <param name="log">Specifies the output Log.</param>
        /// <param name="rg">Specifies the byte array to read.</param>
        /// <returns>The newly loaded Blob (caller owns and must dispose it).</returns>
        public static Blob<T> FromByteArray(CudaDnn<T> cuda, Log log, byte[] rg)
        {
            using (MemoryStream ms = new MemoryStream(rg))
            using (BinaryReader br = new BinaryReader(ms))
            {
                return Load(cuda, log, br, true, true);
            }
        }
2461
2466 public override string ToString()
2467 {
2468 string strSize = (HalfSize) ? "HALF " : "FULL ";
2469 return strSize + m_strName + " (" + shape_string + ")";
2470 }
2471
2478 public string ToString(int nMax, bool bDiff = false)
2479 {
2480 double[] rg = Utility.ConvertVec<T>((bDiff) ? update_cpu_diff() : update_cpu_data());
2481 string str = "{";
2482
2483 for (int i = 0; i < rg.Length && i < nMax; i++)
2484 {
2485 str += rg[i].ToString("N4");
2486 str += ",";
2487 }
2488
2489 str = str.TrimEnd(',');
2490 str += "}";
2491
2492 return str;
2493 }
2494
        /// <summary>
        /// Returns the minimum value in the data (the position of the minimum is discarded).
        /// </summary>
        public double min_data
        {
            get
            {
                long lPos;
                return GetMinData(out lPos);
            }
        }
2506
        /// <summary>
        /// Returns the minimum data value and the position where it was found.
        /// </summary>
        /// <param name="lPos">Returns the position of the minimum, or -1 when the blob is empty.</param>
        /// <returns>The minimum data value, or 0 when the blob is empty or has no GPU data.</returns>
        public double GetMinData(out long lPos)
        {
            lPos = -1;
            if (count() == 0 || gpu_data == 0)
                return 0;

            return m_cuda.min(count(), gpu_data, out lPos);
        }
2520
        /// <summary>
        /// Returns the maximum value in the data (the position of the maximum is discarded).
        /// </summary>
        public double max_data
        {
            get
            {
                long lPos;
                return GetMaxData(out lPos);
            }
        }
2532
        /// <summary>
        /// Returns the maximum data value and the position where it was found.
        /// </summary>
        /// <param name="lPos">Returns the position of the maximum, or -1 when the blob is empty.</param>
        /// <returns>The maximum data value, or 0 when the blob is empty or has no GPU data.</returns>
        public double GetMaxData(out long lPos)
        {
            lPos = -1;
            if (count() == 0 || gpu_data == 0)
                return 0;

            return m_cuda.max(count(), gpu_data, out lPos);
        }
2546
        /// <summary>
        /// Returns the minimum value in the diff (the position of the minimum is discarded).
        /// </summary>
        public double min_diff
        {
            get
            {
                long lPos;
                return GetMinDiff(out lPos);
            }
        }
2558
        /// <summary>
        /// Returns the minimum diff value and the position where it was found.
        /// </summary>
        /// <param name="lPos">Returns the position of the minimum, or -1 when the blob is empty.</param>
        /// <returns>The minimum diff value, or 0 when the blob is empty or has no GPU diff.</returns>
        public double GetMinDiff(out long lPos)
        {
            lPos = -1;
            if (count() == 0 || gpu_diff == 0)
                return 0;

            return m_cuda.min(count(), gpu_diff, out lPos);
        }
2572
        /// <summary>
        /// Returns the maximum value in the diff (the position of the maximum is discarded).
        /// </summary>
        public double max_diff
        {
            get
            {
                long lPos;
                return GetMaxDiff(out lPos);
            }
        }
2584
        /// <summary>
        /// Returns the maximum diff value and the position where it was found.
        /// </summary>
        /// <param name="lPos">Returns the position of the maximum, or -1 when the blob is empty.</param>
        /// <returns>The maximum diff value, or 0 when the blob is empty or has no GPU diff.</returns>
        public double GetMaxDiff(out long lPos)
        {
            lPos = -1;
            if (count() == 0 || gpu_diff == 0)
                return 0;

            return m_cuda.max(count(), gpu_diff, out lPos);
        }
2598
2599 private int get_index_up_to(List<int> rgShape, int nMax = 12800)
2600 {
2601 int nIndexUpTo = m_rgShape.Count - 1;
2602 int nNum = m_rgShape[nIndexUpTo];
2603
2604 while (nIndexUpTo > 0 && nNum < nMax)
2605 {
2606 nNum *= m_rgShape[nIndexUpTo-1];
2607 if (nNum < nMax)
2608 nIndexUpTo--;
2609 }
2610
2611 if (nNum > 1 && nIndexUpTo == 0 && m_rgShape.Count > 1)
2612 nIndexUpTo++;
2613
2614 return nIndexUpTo;
2615 }
2616
        /// <summary>
        /// Returns the (min, max, nan-count, inf-count) of the data, using a work blob as GPU
        /// scratch space. Optionally processes the blob in chunks along the leading axes.
        /// </summary>
        /// <param name="work">Specifies a workspace blob; it is reshaped by this call.</param>
        /// <param name="bDetectNans">Optionally, also count NaN and Infinity values.</param>
        /// <param name="bUseChunks">Optionally, compute the result chunk-by-chunk (useful for very large blobs).</param>
        /// <returns>A tuple of (min, max, nan count, inf count); zeros when the blob is empty.</returns>
        public Tuple<double, double, double, double> minmax_data(Blob<T> work, bool bDetectNans = false, bool bUseChunks = false)
        {
            int nCount = count();

            if (nCount == 0 || gpu_data == 0)
                return new Tuple<double, double, double, double>(0, 0, 0, 0);

            // Single element: read it directly on the CPU.
            if (nCount == 1)
            {
                double[] rgdf = Utility.ConvertVec<T>(mutable_cpu_data);
                return new Tuple<double, double, double, double>(rgdf[0], rgdf[0], double.IsNaN(rgdf[0]) ? 1 : 0, double.IsInfinity(rgdf[0]) ? 1 : 0);
            }

            // NOTE(review): the first Reshape appears intended to guarantee work has capacity
            // for nCount + 64 elements before shrinking to this blob's shape - confirm
            // Reshape grows capacity without trimming it.
            work.Reshape(nCount + 64, 1, 1, 1);
            work.ReshapeLike(this);

            int nIndexUpTo = get_index_up_to(m_rgShape);
            if (nIndexUpTo == 0 || nIndexUpTo >= m_rgShape.Count || !bUseChunks)
                return m_cuda.minmax(nCount, gpu_data, work.mutable_gpu_data, work.mutable_gpu_diff, bDetectNans);

            List<double> rgdfMax = new List<double>();
            List<double> rgdfMin = new List<double>();
            List<double> rgdfItem3 = new List<double>();
            List<double> rgdfItem4 = new List<double>();
            List<int> rgShape = new List<int>();
            int nNum = 1;

            // Collapse the leading axes (before nIndexUpTo) into nNum chunks; the chunk
            // shape keeps the trailing axes and has 1's in the leading positions.
            for (int i = 0; i < m_rgShape.Count; i++)
            {
                if (i < nIndexUpTo)
                {
                    nNum *= m_rgShape[i];
                    rgShape.Add(1);
                }
                else
                {
                    rgShape.Add(m_rgShape[i]);
                }
            }

            // NOTE(review): 'item' is not disposed if an exception occurs below - a
            // try/finally would be safer; left as-is to preserve behavior.
            Blob<T> item = new Blob<T>(m_cuda, m_log, rgShape, false);

            for (int i = 0; i < nNum; i++)
            {
                nCount = item.count();
                m_cuda.copy(nCount, gpu_data, item.mutable_gpu_data, i * nCount, 0);
                Tuple<double, double, double, double> minmax = m_cuda.minmax(nCount, item.gpu_data, work.mutable_gpu_data, work.mutable_gpu_diff, bDetectNans);
                rgdfMin.Add(minmax.Item1);
                rgdfMax.Add(minmax.Item2);
                rgdfItem3.Add(minmax.Item3);
                rgdfItem4.Add(minmax.Item4);
            }

            item.Dispose();

            // Combine chunk results: min/max across chunks, nan/inf counts summed.
            double dfMin = rgdfMin.Min(p => p);
            double dfMax = rgdfMax.Max(p => p);
            double dfItem3 = rgdfItem3.Sum(p => p);
            double dfItem4 = rgdfItem4.Sum(p => p);

            return new Tuple<double, double, double, double>(dfMin, dfMax, dfItem3, dfItem4);
        }
2686
        /// <summary>
        /// Returns the (min, max, nan-count, inf-count) of the diff, using a work blob as GPU
        /// scratch space. Optionally processes the blob in chunks along the leading axes.
        /// </summary>
        /// <param name="work">Specifies a workspace blob; it is reshaped by this call.</param>
        /// <param name="bDetectNans">Optionally, also count NaN and Infinity values.</param>
        /// <param name="bUseChunks">Optionally, compute the result chunk-by-chunk (useful for very large blobs).</param>
        /// <returns>A tuple of (min, max, nan count, inf count); zeros when the blob is empty.</returns>
        public Tuple<double, double, double, double> minmax_diff(Blob<T> work, bool bDetectNans = false, bool bUseChunks = false)
        {
            int nCount = count();

            if (nCount == 0 || gpu_diff == 0)
                return new Tuple<double, double, double, double>(0, 0, 0, 0);

            // Single element: read it directly on the CPU.
            if (nCount == 1)
            {
                double[] rgdf = Utility.ConvertVec<T>(mutable_cpu_diff);
                return new Tuple<double, double, double, double>(rgdf[0], rgdf[0], double.IsNaN(rgdf[0]) ? 1 : 0, double.IsInfinity(rgdf[0]) ? 1 : 0);
            }

            // NOTE(review): same capacity-priming pattern as minmax_data - confirm Reshape
            // grows capacity without trimming it.
            work.Reshape(nCount + 64, 1, 1, 1);
            work.ReshapeLike(this);

            int nIndexUpTo = get_index_up_to(m_rgShape);
            if (nIndexUpTo == 0 || nIndexUpTo >= m_rgShape.Count || !bUseChunks)
                return m_cuda.minmax(nCount, gpu_diff, work.mutable_gpu_data, work.mutable_gpu_diff, bDetectNans);

            List<double> rgdfMax = new List<double>();
            List<double> rgdfMin = new List<double>();
            List<double> rgdfItem3 = new List<double>();
            List<double> rgdfItem4 = new List<double>();
            List<int> rgShape = new List<int>();
            int nNum = 1;

            // Collapse the leading axes (before nIndexUpTo) into nNum chunks; the chunk
            // shape keeps the trailing axes and has 1's in the leading positions.
            for (int i = 0; i < m_rgShape.Count; i++)
            {
                if (i < nIndexUpTo)
                {
                    nNum *= m_rgShape[i];
                    rgShape.Add(1);
                }
                else
                {
                    rgShape.Add(m_rgShape[i]);
                }
            }

            // NOTE(review): 'item' is not disposed if an exception occurs below - a
            // try/finally would be safer; left as-is to preserve behavior.
            Blob<T> item = new Blob<T>(m_cuda, m_log, rgShape, false);

            for (int i = 0; i < nNum; i++)
            {
                nCount = item.count();
                m_cuda.copy(nCount, gpu_diff, item.mutable_gpu_data, i * nCount, 0);
                Tuple<double, double, double, double> minmax = m_cuda.minmax(nCount, item.gpu_data, work.mutable_gpu_data, work.mutable_gpu_diff, bDetectNans);
                rgdfMin.Add(minmax.Item1);
                rgdfMax.Add(minmax.Item2);
                rgdfItem3.Add(minmax.Item3);
                rgdfItem4.Add(minmax.Item4);
            }

            item.Dispose();

            // Combine chunk results: min/max across chunks, nan/inf counts summed.
            double dfMin = rgdfMin.Min(p => p);
            double dfMax = rgdfMax.Max(p => p);
            double dfItem3 = rgdfItem3.Sum(p => p);
            double dfItem4 = rgdfItem4.Sum(p => p);

            return new Tuple<double, double, double, double>(dfMin, dfMax, dfItem3, dfItem4);
        }
2756
2761 {
2762 get { return m_type; }
2763 set { m_type = value; }
2764 }
2765
        /// <summary>
        /// Get/set an arbitrary user-defined object associated with the Blob (not used internally).
        /// </summary>
        public object Tag
        {
            get { return m_tag; }
            set { m_tag = value; }
        }
2774
        /// <summary>
        /// Adds a scalar value to every element of the data (in place on the GPU).
        /// </summary>
        /// <param name="dfVal">Specifies the scalar value to add.</param>
        public void add_scalar(double dfVal)
        {
            m_cuda.add_scalar(count(), dfVal, mutable_gpu_data);
        }
2783
2784#pragma warning disable 1591
2785
        /// <summary>
        /// Transposes the data in place, treating it as a (height*width) x channels matrix.
        /// A temporary GPU copy of the data is used as the transpose source and freed afterward.
        /// NOTE(review): the temporary is not freed if matrix_transpose throws - confirm acceptable.
        /// </summary>
        public void rollaxis()
        {
            long hDataT = m_cuda.AllocMemory(mutable_cpu_data);
            m_cuda.matrix_transpose(width * height, channels, hDataT, mutable_gpu_data);
            m_cuda.FreeMemory(hDataT);
        }
2792
        /// <summary>
        /// Saves each item of the blob as a PNG image named "img_{n}_label_{label}.png" in the
        /// given directory, using the per-item labels in blobLabels. Values are optionally
        /// divided by dfScale and clamped to [0, 255] before conversion to pixels.
        /// </summary>
        /// <param name="strPath">Specifies the output directory (created when missing).</param>
        /// <param name="blobLabels">Specifies a blob holding one label value per item.</param>
        /// <param name="dfScale">Specifies the divisor applied to non-zero values (1.0 = no scaling).</param>
        public void save_images(string strPath, Blob<T> blobLabels, double dfScale)
        {
            if (!Directory.Exists(strPath))
                Directory.CreateDirectory(strPath);

            T[] rgLabels = blobLabels.update_cpu_data();
            T[] rgData = update_cpu_data();

            if (dfScale != 1.0)
            {
                // Rescale and clamp each non-zero value into the displayable byte range.
                for (int i = 0; i < rgData.Length; i++)
                {
                    double dfVal = Utility.ConvertVal<T>(rgData[i]);

                    if (dfVal != 0)
                    {
                        dfVal /= dfScale;

                        if (dfVal < 0)
                            dfVal = 0;

                        if (dfVal > 255)
                            dfVal = 255;

                        rgData[i] = Utility.ConvertVal<T>(dfVal);
                    }
                }
            }

            strPath = strPath.TrimEnd('\\');

            // Number of values per item (one image per item in the batch).
            int nCount = channels * height * width;

            for (int n = 0; n < num; n++)
            {
                int nIdx = n * nCount;
                Datum d = ImageData.GetImageData<T>(rgData, channels, height, width, false, nIdx, nCount);
                Image img = ImageData.GetImage(d);

                int nLabel = (int)(float)Convert.ChangeType(rgLabels[n], typeof(float));

                string strName = strPath + "\\img_" + n.ToString() + "_label_" + nLabel.ToString() + ".png";
                img.Save(strName, System.Drawing.Imaging.ImageFormat.Png);

                img.Dispose();
            }
        }
2840
2841#pragma warning restore 1591
2842
        /// <summary>
        /// Returns a new blob whose last two axes (height, width) are resized to the given shape
        /// using bitmap interpolation. Each (n, c) plane is normalized to [0, 255], rendered to a
        /// grayscale bitmap, resized with ImageTools.ResizeImage, then mapped back to the
        /// original value range. Only 4-axis blobs are supported, and num/channels must match.
        /// </summary>
        /// <param name="rgShape">Specifies the new shape; only the last two entries may differ.</param>
        /// <returns>A new resized Blob (caller owns and must dispose it).</returns>
        public Blob<T> Resize(List<int> rgShape)
        {
            m_log.CHECK_EQ(num_axes, rgShape.Count, "When resizing, the new shape must have the same number of axes as the blob to be resized.");
            m_log.CHECK_EQ(num_axes, 4, "Resizing only allowed on 4 axis blobs.");
            m_log.CHECK_EQ(num, rgShape[0], "Resizing only allowed on the last two axes.");
            m_log.CHECK_EQ(channels, rgShape[1], "Resizing only allowed on the last two axes.");

            T[] rgData = mutable_cpu_data;
            float[] rgDataF = Utility.ConvertVecF<T>(rgData);

            Blob<T> newBlob = Clone();
            newBlob.Reshape(rgShape);

            T[] rgDataNew = newBlob.mutable_cpu_data;
            float[] rgDataNewF = Utility.ConvertVecF<T>(rgDataNew);

            // One bitmap at the source size is reused for every (n, c) plane.
            Bitmap bmp = new Bitmap(width, height);

            for (int n = 0; n < num; n++)
            {
                for (int c = 0; c < channels; c++)
                {
                    float fMin = float.MaxValue;
                    float fMax = -float.MaxValue;
                    // nH/nW/nSize track the source dims here and are re-pointed at the
                    // destination dims below, so they are reset each channel iteration.
                    int nH = height;
                    int nW = width;
                    int nSize = nH * nW;

                    // Pass 1: find the plane's value range for normalization.
                    for (int y = 0; y < nH; y++)
                    {
                        for (int x = 0; x < nW; x++)
                        {
                            int nIdx = n * (channels * nSize) + c * nSize + y * nW + x;
                            float fVal = rgDataF[nIdx];

                            if (fVal < fMin)
                                fMin = fVal;

                            if (fVal > fMax)
                                fMax = fVal;
                        }
                    }

                    // Pass 2: render the normalized plane as a grayscale bitmap.
                    // NOTE(review): a constant plane (fMax == fMin) divides by zero here - confirm inputs.
                    for (int y = 0; y < nH; y++)
                    {
                        for (int x = 0; x < nW; x++)
                        {
                            int nIdx = n * (channels * nSize) + c * nSize + y * nW + x;
                            float fVal = rgDataF[nIdx];

                            fVal = ((fVal - fMin) / (fMax - fMin)) * 255.0f; // move into range 0,255

                            bmp.SetPixel(x, y, Color.FromArgb((int)fVal, (int)fVal, (int)fVal));
                        }
                    }

                    Bitmap bmpNew = ImageTools.ResizeImage(bmp, newBlob.width, newBlob.height);

                    // Switch the index math to the destination dimensions.
                    nH = newBlob.height;
                    nW = newBlob.width;
                    nSize = nH * nW;

                    // Pass 3: read the resized pixels back, denormalizing to the original range.
                    for (int y = 0; y < nH; y++)
                    {
                        for (int x = 0; x < nW; x++)
                        {
                            int nIdx = n * (channels * nSize) + c * nSize + y * nW + x;

                            Color clr = bmpNew.GetPixel(x, y);
                            float fVal = ((clr.R / 255.0f) * (fMax - fMin)) + fMin; // move back to original range.

                            rgDataNewF[nIdx] = fVal;
                        }
                    }

                    bmpNew.Dispose();
                }
            }

            bmp.Dispose();
            newBlob.mutable_cpu_data = Utility.ConvertVec<T>(rgDataNewF);

            return newBlob;
        }
2936
        /// <summary>
        /// Normalizes the data in place to zero mean and unit standard deviation. When the mean
        /// and std are not supplied, they are computed from the current data.
        /// </summary>
        /// <param name="dfMean">Optionally, specifies the mean to subtract.</param>
        /// <param name="dfStd">Optionally, specifies the standard deviation to divide by.</param>
        public void NormalizeData(double? dfMean = null, double? dfStd = null)
        {
            // Either value missing => compute both from the data.
            if (!dfMean.HasValue || !dfStd.HasValue)
            {
                float[] rgF = Utility.ConvertVecF<T>(update_cpu_data());

                dfMean = mean(rgF);
                dfStd = std(dfMean.Value, rgF);
            }

            if (dfMean.Value != 0)
                m_cuda.add_scalar(count(), -1 * dfMean.Value, mutable_gpu_data);

            // Skip the divide when std is 0 (avoids divide-by-zero) or 1 (no-op).
            if (dfStd.Value != 0 && dfStd.Value != 1.0)
                m_cuda.mul_scalar(count(), 1.0 / dfStd.Value, mutable_gpu_data);
        }
2958
2965 public double mean(float[] rgDf = null, bool bDiff = false)
2966 {
2967 double dfSum = 0;
2968
2969 if (rgDf == null)
2970 rgDf = Utility.ConvertVecF<T>((bDiff) ? update_cpu_diff() : update_cpu_data());
2971
2972 for (int i = 0; i < rgDf.Length; i++)
2973 {
2974 dfSum += rgDf[i];
2975 }
2976
2977 return dfSum / rgDf.Length;
2978 }
2979
2986 public double sum(float[] rgDf = null, bool bDiff = false)
2987 {
2988 double dfSum = 0;
2989
2990 if (rgDf == null)
2991 rgDf = Utility.ConvertVecF<T>((bDiff) ? update_cpu_diff() : update_cpu_data());
2992
2993 for (int i = 0; i < rgDf.Length; i++)
2994 {
2995 dfSum += rgDf[i];
2996 }
2997
2998 return dfSum;
2999 }
3000
3007 public double std(double? dfMean = null, float[] rgDf = null)
3008 {
3009 double dfSum = 0;
3010
3011 if (rgDf == null)
3012 rgDf = Utility.ConvertVecF<T>(update_cpu_data());
3013
3014 if (!dfMean.HasValue)
3015 dfMean = mean(rgDf);
3016
3017 for (int i = 0; i < rgDf.Length; i++)
3018 {
3019 dfSum += Math.Pow(rgDf[i] - dfMean.Value, 2);
3020 }
3021
3022 return Math.Sqrt(dfSum / rgDf.Length);
3023 }
3024
        /// <summary>
        /// Sets the R, G, B values of one pixel (planar layout: one full plane per color channel)
        /// and returns the previous values at those locations.
        /// </summary>
        /// <param name="nX">Specifies the pixel x position.</param>
        /// <param name="nY">Specifies the pixel y position.</param>
        /// <param name="R">Specifies the red value.</param>
        /// <param name="G">Specifies the green value.</param>
        /// <param name="B">Specifies the blue value.</param>
        /// <param name="order">Optionally, specifies the channel plane order of the blob (RGB or BGR).</param>
        /// <returns>The previous values at the three locations.</returns>
        public Tuple<T, T, T> SetPixel(int nX, int nY, byte R, byte G, byte B, TransformationParameter.COLOR_ORDER order = TransformationParameter.COLOR_ORDER.RGB)
        {
            int nDim = width * height;
            int nIdxR = nY * width + nX;
            int nIdxG = nDim + nIdxR;
            int nIdxB = nDim + nDim + nIdxR;

            // For BGR layout, the red value goes to the last plane and blue to the first.
            if (order == TransformationParameter.COLOR_ORDER.BGR)
            {
                int nTemp = nIdxB;
                nIdxB = nIdxR;
                nIdxR = nTemp;
            }

            T fR = Utility.ConvertVal<T>((double)R);
            T fG = Utility.ConvertVal<T>((double)G);
            T fB = Utility.ConvertVal<T>((double)B);

            T[] rg = m_cuda.SetPixel(mutable_gpu_data, count(), true, 0, new Tuple<int, T>(nIdxR, fR), new Tuple<int, T>(nIdxG, fG), new Tuple<int, T>(nIdxB, fB));

            return new Tuple<T, T, T>(rg[0], rg[1], rg[2]);
        }
3057
        /// <summary>
        /// Sets the R, G, B values of one pixel from a pixel tuple (planar layout: one full plane
        /// per color channel), optionally returning the previous values.
        /// </summary>
        /// <param name="nX">Specifies the pixel x position.</param>
        /// <param name="nY">Specifies the pixel y position.</param>
        /// <param name="pixel">Specifies the new (R, G, B) values.</param>
        /// <param name="bReturnOriginal">Optionally, return the previous values at the pixel.</param>
        /// <param name="order">Optionally, specifies the channel plane order of the blob (RGB or BGR).</param>
        /// <param name="nOffset">Optionally, specifies an offset added to the pixel locations.</param>
        /// <returns>The previous values when requested; otherwise <i>null</i>.</returns>
        public Tuple<T, T, T> SetPixel(int nX, int nY, Tuple<T, T, T> pixel, bool bReturnOriginal = false, TransformationParameter.COLOR_ORDER order = TransformationParameter.COLOR_ORDER.RGB, int nOffset = 0)
        {
            int nDim = width * height;
            int nIdxR = nY * width + nX;
            int nIdxG = nDim + nIdxR;
            int nIdxB = nDim + nDim + nIdxR;

            // For BGR layout, the red value goes to the last plane and blue to the first.
            if (order == TransformationParameter.COLOR_ORDER.BGR)
            {
                int nTemp = nIdxB;
                nIdxB = nIdxR;
                nIdxR = nTemp;
            }

            T fR = pixel.Item1;
            T fG = pixel.Item2;
            T fB = pixel.Item3;

            if (bReturnOriginal)
            {
                T[] rg = m_cuda.SetPixel(mutable_gpu_data, count(), true, nOffset, new Tuple<int, T>(nIdxR, fR), new Tuple<int, T>(nIdxG, fG), new Tuple<int, T>(nIdxB, fB));
                return new Tuple<T, T, T>(rg[0], rg[1], rg[2]);
            }
            else
            {
                m_cuda.SetPixel(mutable_gpu_data, count(), true, nOffset, new Tuple<int, T>(nIdxR, fR), new Tuple<int, T>(nIdxG, fG), new Tuple<int, T>(nIdxB, fB));
                return null;
            }
        }
3097
        /// <summary>
        /// Saves a visualization of the blob to an image file: one tile per (num, channel) pair,
        /// separated by 1-pixel black gutters. Negative values render red, positive green (or
        /// white in exist-only mode); values found in rgSpecialValues use their mapped color.
        /// </summary>
        /// <param name="strFile">Specifies the image file path to write.</param>
        /// <param name="bNonZeroExistOnly">Optionally, render any non-zero value as white instead of intensity-scaled red/green.</param>
        /// <param name="bSaveDiff">Optionally, visualize the diff instead of the data.</param>
        /// <param name="rgSpecialValues">Optionally, maps specific values to fixed colors.</param>
        public void SaveToImage(string strFile, bool bNonZeroExistOnly = true, bool bSaveDiff = false, Dictionary<float, Color> rgSpecialValues = null)
        {
            Blob<T> blobWork = new Blob<T>(m_cuda, m_log);
            float[] rgData;
            double dfMin = 1;
            double dfMax = 1;
            int nWid = width;
            int nHt = height;
            int nNumY = num;
            int nNumX = channels;

            try
            {
                blobWork.ReshapeLike(this);

                // Pull the values to visualize; the min/max range is only needed when
                // intensity-scaling (i.e., not in exist-only mode).
                if (bSaveDiff)
                {
                    rgData = Utility.ConvertVecF<T>(mutable_cpu_diff);

                    if (!bNonZeroExistOnly)
                    {
                        Tuple<double, double, double, double> minmax = minmax_diff(blobWork);
                        dfMin = minmax.Item1;
                        dfMax = minmax.Item2;
                    }
                }
                else
                {
                    rgData = Utility.ConvertVecF<T>(mutable_cpu_data);

                    if (!bNonZeroExistOnly)
                    {
                        Tuple<double, double, double, double> minmax = minmax_data(blobWork);
                        dfMin = minmax.Item1;
                        dfMax = minmax.Item2;
                    }
                }

                // Degenerate spatial dims: fold num/channels into the tile itself so the
                // image is a single (or single-row) grid.
                if (nWid == 1 && nHt == 1)
                {
                    nNumX = 1;
                    nNumY = 1;
                    nHt = num;
                    nWid = channels;
                }
                else if (nWid == 1)
                {
                    nNumY = num;
                    nNumX = 1;
                    nWid = height;
                    nHt = channels;
                }

                // Grid of nNumX x nNumY tiles with 1-pixel gutters, on a black background.
                Bitmap bmp = new Bitmap(nNumX * nWid + (nNumX - 1), nNumY * nHt + (nNumY - 1));
                using (Graphics g = Graphics.FromImage(bmp))
                {
                    g.FillRectangle(Brushes.Black, 0, 0, bmp.Width, bmp.Height);
                }

                // LockBitmap gives direct pixel access (much faster than Bitmap.SetPixel).
                LockBitmap bmp1 = new LockBitmap(bmp);
                bmp1.LockBits();

                // (nX, nY) is the current tile origin; (nX1, nY1) is the current pixel.
                int nX = 0;
                int nY = 0;
                int nX1 = 0;
                int nY1 = 0;

                for (int y = 0; y < nNumY; y++)
                {
                    for (int x = 0; x < nNumX; x++)
                    {
                        for (int h = 0; h < nHt; h++)
                        {
                            for (int w = 0; w < nWid; w++)
                            {
                                int nIdx = y * nNumX * nHt * nWid + x * nHt * nWid + h * nWid + w;
                                float fVal = rgData[nIdx];
                                Color clr = Color.Empty;

                                if (rgSpecialValues != null && rgSpecialValues.ContainsKey(fVal))
                                {
                                    clr = rgSpecialValues[fVal];
                                }
                                else if (fVal < 0)
                                {
                                    if (bNonZeroExistOnly)
                                    {
                                        clr = Color.White;
                                    }
                                    else
                                    {
                                        // Red intensity scaled over [dfMin, 0].
                                        int nClr = (int)(255 * (rgData[nIdx] - dfMin) / (0 - dfMin));
                                        clr = Color.FromArgb(nClr, 0, 0);
                                    }
                                }
                                else if (fVal > 0)
                                {
                                    if (bNonZeroExistOnly)
                                    {
                                        clr = Color.White;
                                    }
                                    else
                                    {
                                        // Green intensity scaled over [0, dfMax].
                                        int nClr = (int)(255 * (rgData[nIdx] - 0) / (dfMax - 0));
                                        clr = Color.FromArgb(0, nClr, 0);
                                    }
                                }

                                // Zero values (with no special mapping) keep the black background.
                                if (!clr.IsEmpty)
                                    bmp1.SetPixel(nX1, nY1, clr);

                                nX1++;
                            }

                            nX1 = nX;
                            nY1++;
                        }

                        // Advance one tile to the right (plus the 1-pixel gutter).
                        nX += nWid + 1;
                        nX1 = nX;
                        nY1 = nY;
                    }

                    // Advance one tile row down (plus the 1-pixel gutter).
                    nX = 0;
                    nY += nHt + 1;
                    nY1 = nY;
                }

                bmp1.UnlockBits();
                bmp.Save(strFile);
            }
            finally
            {
                blobWork.Dispose();
            }
        }
3241
        /// <summary>
        /// Placeholder - intentionally empty (not yet implemented); parameters are ignored.
        /// </summary>
        /// <param name="b">Specifies the blob that would be drawn.</param>
        /// <param name="strFile">Specifies the file that would be written.</param>
        private void drawImage(Blob<T> b, string strFile)
        {
        }
3250
3259 public void SaveToNumpy(string strFile, bool bSaveDiff = false)
3260 {
3261 using (FileStream fs = File.Open(strFile, FileMode.Create))
3262 using (BinaryWriter bw = new BinaryWriter(fs))
3263 {
3264 bw.Write((byte)0x93);
3265 bw.Write((byte)0x4E); // N
3266 bw.Write((byte)0x55); // U
3267 bw.Write((byte)0x4D); // M
3268 bw.Write((byte)0x50); // P
3269 bw.Write((byte)0x59); // Y
3270 bw.Write((byte)0x01);
3271 bw.Write((byte)0x00);
3272
3273 string strHeader = "{'descr': '<f4', 'fortran_order': False, 'shape': (";
3274 for (int i = 0; i < shape().Count; i++)
3275 {
3276 strHeader += shape(i).ToString() + ",";
3277 }
3278
3279 strHeader = strHeader.TrimEnd(',');
3280 strHeader += ")";
3281 strHeader += ", }";
3282 strHeader = strHeader.PadRight(117, ' ');
3283 strHeader += "\n";
3284
3285 byte bLen = (byte)strHeader.Length;
3286 bw.Write(bLen);
3287 bw.Write((byte)0x00);
3288
3289 foreach (char ch in strHeader)
3290 {
3291 bw.Write((byte)ch);
3292 }
3293
3294 float[] rgData;
3295 if (bSaveDiff)
3296 rgData = Utility.ConvertVecF<T>(mutable_cpu_diff);
3297 else
3298 rgData = Utility.ConvertVecF<T>(mutable_cpu_data);
3299
3300 for (int i = 0; i < rgData.Length; i++)
3301 {
3302 bw.Write(rgData[i]);
3303 }
3304 }
3305 }
3306
3316 public static void SaveToNumpy(string strFile, float[] rgData, int[] rgShape)
3317 {
3318 using (FileStream fs = File.Open(strFile, FileMode.Create))
3319 using (BinaryWriter bw = new BinaryWriter(fs))
3320 {
3321 bw.Write((byte)0x93);
3322 bw.Write((byte)0x4E); // N
3323 bw.Write((byte)0x55); // U
3324 bw.Write((byte)0x4D); // M
3325 bw.Write((byte)0x50); // P
3326 bw.Write((byte)0x59); // Y
3327 bw.Write((byte)0x01);
3328 bw.Write((byte)0x00);
3329
3330 string strHeader = "{'descr': '<f4', 'fortran_order': False, 'shape': (";
3331 for (int i = 0; i < rgShape.Length; i++)
3332 {
3333 strHeader += rgShape[i].ToString() + ",";
3334 }
3335
3336 strHeader = strHeader.TrimEnd(',');
3337 strHeader += ")";
3338 strHeader += ", }";
3339 strHeader = strHeader.PadRight(117, ' ');
3340 strHeader += "\n";
3341
3342 byte bLen = (byte)strHeader.Length;
3343 bw.Write(bLen);
3344 bw.Write((byte)0x00);
3345
3346 foreach (char ch in strHeader)
3347 {
3348 bw.Write((byte)ch);
3349 }
3350
3351 for (int i = 0; i < rgData.Length; i++)
3352 {
3353 bw.Write(rgData[i]);
3354 }
3355 }
3356 }
3357
3367 public static void SaveToNumpy(string strFile, int[] rgData, int[] rgShape)
3368 {
3369 using (FileStream fs = File.Open(strFile, FileMode.Create))
3370 using (BinaryWriter bw = new BinaryWriter(fs))
3371 {
3372 bw.Write((byte)0x93);
3373 bw.Write((byte)0x4E); // N
3374 bw.Write((byte)0x55); // U
3375 bw.Write((byte)0x4D); // M
3376 bw.Write((byte)0x50); // P
3377 bw.Write((byte)0x59); // Y
3378 bw.Write((byte)0x01);
3379 bw.Write((byte)0x00);
3380
3381 string strHeader = "{'descr': '<i4', 'fortran_order': False, 'shape': (";
3382 for (int i = 0; i < rgShape.Length; i++)
3383 {
3384 strHeader += rgShape[i].ToString() + ",";
3385 }
3386
3387 strHeader = strHeader.TrimEnd(',');
3388 strHeader += ")";
3389 strHeader += ", }";
3390 strHeader = strHeader.PadRight(117, ' ');
3391 strHeader += "\n";
3392
3393 byte bLen = (byte)strHeader.Length;
3394 bw.Write(bLen);
3395 bw.Write((byte)0x00);
3396
3397 foreach (char ch in strHeader)
3398 {
3399 bw.Write((byte)ch);
3400 }
3401
3402 for (int i = 0; i < rgData.Length; i++)
3403 {
3404 bw.Write(rgData[i]);
3405 }
3406 }
3407 }
3408
3418 public static void SaveToNumpy(string strFile, long[] rgData, int[] rgShape)
3419 {
3420 using (FileStream fs = File.Open(strFile, FileMode.Create))
3421 using (BinaryWriter bw = new BinaryWriter(fs))
3422 {
3423 bw.Write((byte)0x93);
3424 bw.Write((byte)0x4E); // N
3425 bw.Write((byte)0x55); // U
3426 bw.Write((byte)0x4D); // M
3427 bw.Write((byte)0x50); // P
3428 bw.Write((byte)0x59); // Y
3429 bw.Write((byte)0x01);
3430 bw.Write((byte)0x00);
3431
3432 string strHeader = "{'descr': '<i8', 'fortran_order': False, 'shape': (";
3433 for (int i = 0; i < rgShape.Length; i++)
3434 {
3435 strHeader += rgShape[i].ToString() + ",";
3436 }
3437
3438 strHeader = strHeader.TrimEnd(',');
3439 strHeader += ")";
3440 strHeader += ", }";
3441 strHeader = strHeader.PadRight(117, ' ');
3442 strHeader += "\n";
3443
3444 byte bLen = (byte)strHeader.Length;
3445 bw.Write(bLen);
3446 bw.Write((byte)0x00);
3447
3448 foreach (char ch in strHeader)
3449 {
3450 bw.Write((byte)ch);
3451 }
3452
3453 for (int i = 0; i < rgData.Length; i++)
3454 {
3455 bw.Write(rgData[i]);
3456 }
3457 }
3458 }
3459
3473 public Tuple<float[], int[]> LoadFromNumpy(string strFile, bool bLoadDiff = false, bool bLoadDataOnly = false, Log log = null, int nMax = int.MaxValue)
3474 {
3475 using (FileStream fs = File.OpenRead(strFile))
3476 using (BinaryReader br = new BinaryReader(fs))
3477 {
3478 byte[] rgMagic = new byte[6];
3479 for (int i = 0; i < rgMagic.Length; i++)
3480 {
3481 rgMagic[i] = br.ReadByte();
3482 }
3483
3484 if (rgMagic[0] != 0x93 || rgMagic[1] != 0x4E || rgMagic[2] != 0x55 || rgMagic[3] != 0x4D || rgMagic[4] != 0x50 || rgMagic[5] != 0x59)
3485 throw new Exception("The file is not a valid Numpy file!");
3486
3487 byte bMajor = br.ReadByte();
3488 byte bMinor = br.ReadByte();
3489
3490 if (bMajor != 1 || bMinor != 0)
3491 throw new Exception("The file is not a valid Numpy file!");
3492
3493 byte bHeaderLen1 = br.ReadByte();
3494 byte bHeaderLen2 = br.ReadByte();
3495 int nHeaderLen = bHeaderLen2 << 8 | bHeaderLen1;
3496
3497 byte[] rgHeader = new byte[nHeaderLen];
3498 for (int i = 0; i < rgHeader.Length; i++)
3499 {
3500 rgHeader[i] = br.ReadByte();
3501 }
3502 string strHeader = Encoding.ASCII.GetString(rgHeader);
3503
3504 bool bFortranOrder;
3505 int[] rgShape;
3506 Type dataType;
3507 int nCount = parseHeader(strHeader, out bFortranOrder, out rgShape, out dataType, nMax);
3508 if (nCount < 0)
3509 throw new Exception("The file size is too large for a flat array.");
3510
3511 if (bFortranOrder)
3512 throw new Exception("Currently the fortran ordering is not supported");
3513
3514 Stopwatch sw = null;
3515 if (log != null)
3516 {
3517 sw = new Stopwatch();
3518 sw.Start();
3519 }
3520
3521 float[] rgData = new float[nCount];
3522 for (int i = 0; i < rgData.Length; i++)
3523 {
3524 if (dataType == typeof(float))
3525 rgData[i] = br.ReadSingle();
3526 else if (dataType == typeof(double))
3527 rgData[i] = (float)br.ReadDouble();
3528 else if (dataType == typeof(int))
3529 rgData[i] = (float)br.ReadInt32();
3530 else if (dataType == typeof(long))
3531 rgData[i] = (float)br.ReadInt64();
3532 else if (dataType == typeof(bool))
3533 rgData[i] = (br.ReadBoolean()) ? 1 : 0;
3534 else
3535 throw new Exception("Unsupported data type!");
3536
3537 if (log != null)
3538 {
3539 if (sw.Elapsed.TotalMilliseconds > 1000)
3540 {
3541 double dfPct = (double)i / (double)rgData.Length;
3542 string strOut = "Loading '" + strFile + "' at " + dfPct.ToString("P5") + "...";
3543 log.WriteLine(strOut, true);
3544 sw.Restart();
3545 }
3546 }
3547 }
3548
3549 if (!bLoadDataOnly)
3550 {
3551 Reshape(rgShape);
3552
3553 if (bLoadDiff)
3554 mutable_cpu_diff = Utility.ConvertVec<T>(rgData);
3555 else
3556 mutable_cpu_data = Utility.ConvertVec<T>(rgData);
3557 }
3558
3559 return new Tuple<float[], int[]>(rgData, rgShape);
3560 }
3561 }
3562
        /// <summary>
        /// Load long, int, bool, float, double or fixed-width string data from a (possibly very
        /// large) Numpy .npy file, returning the values one first-axis item (row) at a time.
        /// </summary>
        /// <param name="strFile">Specifies the .npy file to load.</param>
        /// <param name="log">Optionally, specifies a log used to output loading progress (default = null).</param>
        /// <param name="nMax">Optionally, specifies a maximum applied to the first axis of the shape (default = int.MaxValue).</param>
        /// <param name="nStartIdx">Optionally, specifies the first-axis index at which reading starts (default = 0); not supported for string data.</param>
        /// <param name="nCount">Optionally, specifies the number of first-axis items to read (default = int.MaxValue for all remaining).</param>
        /// <returns>A tuple containing the numeric rows, the shape, and any string values is returned.</returns>
        public static Tuple<List<float[]>, int[], List<string>> LoadFromNumpy(string strFile, Log log = null, int nMax = int.MaxValue, int nStartIdx = 0, int nCount = int.MaxValue)
        {
            using (FileStream fs = File.OpenRead(strFile))
            using (BinaryReader br = new BinaryReader(fs))
            {
                // Verify the '\x93NUMPY' magic number.
                byte[] rgMagic = new byte[6];
                for (int i = 0; i < rgMagic.Length; i++)
                {
                    rgMagic[i] = br.ReadByte();
                }

                if (rgMagic[0] != 0x93 || rgMagic[1] != 0x4E || rgMagic[2] != 0x55 || rgMagic[3] != 0x4D || rgMagic[4] != 0x50 || rgMagic[5] != 0x59)
                    throw new Exception("The file is not a valid Numpy file!");

                // Only format version 1.0 is supported.
                byte bMajor = br.ReadByte();
                byte bMinor = br.ReadByte();

                if (bMajor != 1 || bMinor != 0)
                    throw new Exception("The file is not a valid Numpy file!");

                // The header length is a 2-byte little-endian value (low byte first).
                byte bHeaderLen1 = br.ReadByte();
                byte bHeaderLen2 = br.ReadByte();
                int nHeaderLen = bHeaderLen2 << 8 | bHeaderLen1;

                byte[] rgHeader = new byte[nHeaderLen];
                for (int i = 0; i < rgHeader.Length; i++)
                {
                    rgHeader[i] = br.ReadByte();
                }
                string strHeader = Encoding.ASCII.GetString(rgHeader);

                // count.Item1 = number of first-axis items, count.Item2 = elements per item.
                bool bFortranOrder;
                int[] rgShape;
                Type dataType;
                int nDataTypeSize;
                Tuple<int,int> count = parseHeaderEx(strHeader, out bFortranOrder, out rgShape, out dataType, out nDataTypeSize, nMax);

                if (bFortranOrder)
                    throw new Exception("Currently the fortran ordering is not supported");

                Stopwatch sw = null;
                if (log != null)
                {
                    sw = new Stopwatch();
                    sw.Start();
                }

                string strVal;
                ulong ulIdx = 0;

                // Clip the requested item count to what the file actually contains.
                if (nCount == int.MaxValue)
                {
                    nCount = count.Item1;
                }
                else
                {
                    if (nStartIdx + nCount > count.Item1)
                    {
                        nCount = count.Item1 - nStartIdx;

                        if (nCount < 0)
                            nCount = 0;
                    }

                    // NOTE(review): rgShape[0] is only reduced on this branch; when nCount is
                    // left at its default and nStartIdx > 0, the returned shape's first axis
                    // still reflects the full file - confirm callers expect this.
                    rgShape[0] = nCount;
                }

                // Skip ahead to start index (if greater than zero).
                if (nStartIdx > 0)
                {
                    long nSeekPos = fs.Position;
                    long nItemSize = 0;
                    long nItems = 1;

                    // Elements per first-axis item (product of the trailing axes).
                    for (int i = 1; i < rgShape.Length; i++)
                    {
                        nItems *= rgShape[i];
                    }

                    if (nItems > 0)
                    {
                        if (dataType == typeof(float))
                            nItemSize = sizeof(float);
                        else if (dataType == typeof(double))
                            nItemSize = sizeof(double);
                        else if (dataType == typeof(int))
                            nItemSize = sizeof(int);
                        else if (dataType == typeof(string))
                        {
                            // String cells are variable content, so a direct byte seek is unsafe.
                            if (nStartIdx > 0)
                                throw new Exception("String data types do not support starting at an index > 0!");
                        }
                        else if (dataType == typeof(long))
                            nItemSize = sizeof(long);
                        else if (dataType == typeof(bool))
                            nItemSize = sizeof(bool);
                        else
                            throw new Exception("Unsupported data type!");

                        nSeekPos += nItemSize * nItems * nStartIdx;

                        fs.Seek(nSeekPos, SeekOrigin.Begin);
                    }
                }

                // Read one first-axis item at a time, converting each element to float
                // (string cells are collected separately in rgStrData).
                ulong ulTotal = (ulong)nCount * (ulong)count.Item2;
                List<float[]> rgData = new List<float[]>(nCount);
                List<string> rgStrData = new List<string>(nCount);
                if (ulTotal > 0)
                {
                    for (int i = nStartIdx; i < nStartIdx + nCount && i < count.Item1; i++)
                    {
                        float[] rgItem = new float[count.Item2];
                        for (int j = 0; j < count.Item2; j++)
                        {
                            if (dataType == typeof(float))
                                rgItem[j] = br.ReadSingle();
                            else if (dataType == typeof(double))
                                rgItem[j] = (float)br.ReadDouble();
                            else if (dataType == typeof(int))
                                rgItem[j] = (float)br.ReadInt32();
                            else if (dataType == typeof(string))
                            {
                                // '<U' cells are nDataTypeSize characters of 4 bytes each;
                                // the zero padding bytes are dropped and the remainder is
                                // decoded as UTF-8 (leaves rgItem[j] at 0).
                                List<byte> bytes = new List<byte>();
                                byte addByte = 0x00;
                                for (int c = 0; c < nDataTypeSize * 4; c++)
                                {
                                    addByte = br.ReadByte();
                                    if (addByte != 0x00)
                                        bytes.Add(addByte);
                                }
                                strVal = Encoding.UTF8.GetString(bytes.ToArray());
                                rgStrData.Add(strVal);
                            }
                            else if (dataType == typeof(long))
                                rgItem[j] = (float)br.ReadInt64();
                            else if (dataType == typeof(bool))
                                rgItem[j] = (br.ReadBoolean()) ? 1 : 0;
                            else
                                throw new Exception("Unsupported data type!");

                            // Output progress at most once per second.
                            if (log != null)
                            {
                                if (sw.Elapsed.TotalMilliseconds > 1000)
                                {
                                    double dfPct = (double)ulIdx / (double)ulTotal;
                                    string strOut = "Loading '" + strFile + "' at " + dfPct.ToString("P5") + "...";
                                    log.WriteLine(strOut, true);
                                    sw.Restart();
                                }
                            }
                            ulIdx++;
                        }

                        rgData.Add(rgItem);
                    }
                }

                return new Tuple<List<float[]>, int[], List<string>>(rgData, rgShape, rgStrData);
            }
        }
3739
3740 private int parseHeader(string str, out bool bFortranOrder, out int[] rgShape, out Type dataType, int nMax = int.MaxValue)
3741 {
3742 int nCount = 1;
3743 List<int> rgShape1 = new List<int>();
3744 str = str.Trim('{', '}', ' ', '\n', ',');
3745
3746 dataType = typeof(object);
3747
3748 string strShape = null;
3749 string strTarget = "'shape':";
3750 int nPos = str.IndexOf(strTarget);
3751 if (nPos > 0)
3752 {
3753 strShape = str.Substring(nPos + strTarget.Length);
3754 str = str.Substring(0, nPos);
3755
3756 nPos = strShape.IndexOf(')');
3757 str += strShape.Substring(nPos + 1);
3758 str = str.Trim(',', ' ');
3759
3760 strShape = strShape.Substring(0, nPos);
3761 strShape = strShape.Trim(' ', '(', ')');
3762 string[] rgShapeStr = strShape.Split(',');
3763
3764 for (int i=0; i<rgShapeStr.Length; i++)
3765 {
3766 string strShape1 = rgShapeStr[i];
3767 if (!string.IsNullOrEmpty(strShape1))
3768 {
3769 int nShape = int.Parse(strShape1);
3770
3771 if (i == 0 && nShape > nMax)
3772 nShape = nMax;
3773
3774 rgShape1.Add(nShape);
3775 nCount *= rgShape1[rgShape1.Count - 1];
3776 }
3777 }
3778 }
3779
3780 rgShape = rgShape1.ToArray();
3781 bFortranOrder = false;
3782
3783 string[] rgstr = str.Split(',');
3784 foreach (string str1 in rgstr)
3785 {
3786 string[] rgstrKeyVal = str1.Split(':');
3787 if (rgstrKeyVal.Length != 2)
3788 throw new Exception("Invalid header key value, '" + str1 + "'!");
3789
3790 string strKey = rgstrKeyVal[0].Trim('\'', ' ');
3791 string strVal = rgstrKeyVal[1].Trim('\'', ' ');
3792
3793 switch (strKey)
3794 {
3795 case "descr":
3796 if (strVal == "<f4")
3797 dataType = typeof(float);
3798 else if (strVal == "<f8")
3799 dataType = typeof(double);
3800 else if (strVal == "<i4")
3801 dataType = typeof(int);
3802 else if (strVal == "<i8")
3803 dataType = typeof(long);
3804 else if (strVal == "|b1")
3805 dataType = typeof(bool);
3806 else
3807 throw new Exception("Unsupported data type '" + strVal + "', currenly only support '<f4'");
3808 break;
3809
3810 case "fortran_order":
3811 bFortranOrder = bool.Parse(strVal);
3812 break;
3813 }
3814 }
3815
3816 return nCount;
3817 }
3818
3819 private static Tuple<int, int> parseHeaderEx(string str, out bool bFortranOrder, out int[] rgShape, out Type dataType, out int nDataTypeSize, int nMax = int.MaxValue)
3820 {
3821 int nNum = 1;
3822 int nCount = 1;
3823 List<int> rgShape1 = new List<int>();
3824 str = str.Trim('{', '}', ' ', '\n', ',');
3825
3826 dataType = typeof(object);
3827 nDataTypeSize = 1;
3828
3829 string strShape = null;
3830 string strTarget = "'shape':";
3831 int nPos = str.IndexOf(strTarget);
3832 if (nPos > 0)
3833 {
3834 strShape = str.Substring(nPos + strTarget.Length);
3835 str = str.Substring(0, nPos);
3836
3837 nPos = strShape.IndexOf(')');
3838 str += strShape.Substring(nPos + 1);
3839 str = str.Trim(',', ' ');
3840
3841 strShape = strShape.Substring(0, nPos);
3842 strShape = strShape.Trim(' ', '(', ')');
3843 string[] rgShapeStr = strShape.Split(',');
3844
3845 for (int i=0; i<rgShapeStr.Count(); i++)
3846 {
3847 string strShape1 = rgShapeStr[i];
3848 if (!string.IsNullOrEmpty(strShape1))
3849 {
3850 int nShape = int.Parse(strShape1);
3851
3852 if (i == 0 && nShape > nMax)
3853 nShape = nMax;
3854
3855 rgShape1.Add(nShape);
3856
3857 if (i == 0)
3858 nNum = rgShape1[rgShape1.Count - 1];
3859 else
3860 nCount *= rgShape1[rgShape1.Count - 1];
3861 }
3862 }
3863 }
3864
3865 rgShape = rgShape1.ToArray();
3866 bFortranOrder = false;
3867
3868 string[] rgstr = str.Split(',');
3869 foreach (string str1 in rgstr)
3870 {
3871 string[] rgstrKeyVal = str1.Split(':');
3872 if (rgstrKeyVal.Length != 2)
3873 throw new Exception("Invalid header key value, '" + str1 + "'!");
3874
3875 string strKey = rgstrKeyVal[0].Trim('\'', ' ');
3876 string strVal = rgstrKeyVal[1].Trim('\'', ' ');
3877
3878 switch (strKey)
3879 {
3880 case "descr":
3881 if (strVal == "<f4")
3882 dataType = typeof(float);
3883 else if (strVal == "<f8")
3884 dataType = typeof(double);
3885 else if (strVal == "<i4")
3886 dataType = typeof(int);
3887 else if (strVal == "<i8")
3888 dataType = typeof(long);
3889 else if (strVal == "|b1")
3890 dataType = typeof(bool);
3891 else if (strVal.StartsWith("<U"))
3892 {
3893 strVal = strVal.Substring(2);
3894 nDataTypeSize = int.Parse(strVal);
3895 dataType = typeof(string);
3896 }
3897 else
3898 throw new Exception("Unsupported data type '" + strVal + "', currenly only support '<f4'");
3899 break;
3900
3901 case "fortran_order":
3902 bFortranOrder = bool.Parse(strVal);
3903 break;
3904 }
3905 }
3906
3907 return new Tuple<int, int>(nNum, nCount);
3908 }
3909
3922 public void MatMul(Blob<T> blobA, Blob<T> blobB, bool bReshape = false, bool bTransA = false, bool bTransB = false, double dfScale = 1.0, bool bADiff = false, bool bBDiff = false, bool bCDiff = false)
3923 {
3924 m_log.CHECK_EQ(blobA.num_axes, 4, "The blobA must have 4 axes!");
3925 m_log.CHECK_EQ(blobB.num_axes, 4, "The blobB must have 4 axes!");
3926
3927 if (bADiff && blobA.gpu_diff == 0)
3928 m_log.FAIL("Blob A does not have a diff value!");
3929 if (bBDiff && blobB.gpu_diff == 0)
3930 m_log.FAIL("Blob B does not have a diff value!");
3931
3932 for (int i = 0; i < blobA.num_axes - 2; i++)
3933 {
3934 m_log.CHECK_EQ(blobA.shape(i), blobB.shape(i), "Blob A and B must have the same shape at axis '" + i.ToString() + "'!");
3935 }
3936
3937 if (bCDiff && gpu_diff == 0)
3938 m_log.FAIL("This blob does not have a diff value!");
3939
3940 int nAxis = 2;
3941 uint nOuterCount = (uint)blobA.count(0, nAxis);
3942 int m = blobA.shape(2);
3943 int n = blobB.shape(3);
3944 int k = blobA.shape(3);
3945
3946 // Reshape the resulting blob to shape (B,C,M,N)
3947 List<int> rgShape = Utility.Clone<int>(blobA.shape());
3948 rgShape[rgShape.Count - 1] = n;
3949 rgShape[rgShape.Count - 2] = m;
3950
3951 if (bReshape)
3952 Reshape(rgShape);
3953 else
3954 m_log.CHECK(CompareShape(rgShape), "This (resulting) blob does not have the correct shape! Expected shape = " + Utility.ToString<int>(rgShape));
3955
3956 long hA = (bADiff) ? blobA.gpu_diff : blobA.gpu_data;
3957 long hB = (bBDiff) ? blobB.gpu_diff : blobB.gpu_data;
3958 long hC = (bCDiff) ? mutable_gpu_diff : mutable_gpu_data;
3959
3960 m_cuda.matmul(nOuterCount, m, n, k, hA, hB, hC, dfScale, bTransA, bTransB);
3961 }
3962
        /// <summary>
        /// Calculates and propagates the gradients for blobA and blobB given the incoming
        /// gradient in this blob's diff values (where this blob holds C = matmul(A, B)).
        /// </summary>
        /// <param name="blobA">Specifies the first matmul input; receives its gradient in its diff.</param>
        /// <param name="blobB">Specifies the second matmul input; receives its gradient in its diff.</param>
        /// <param name="blobWork">Specifies a work blob used to hold the height/width transposed copies.</param>
        /// <param name="dfScale">Optionally, specifies a scale applied to this blob's diff before propagation (default = 1.0).</param>
        public void MatMulGrad(Blob<T> blobA, Blob<T> blobB, Blob<T> blobWork, double dfScale = 1.0)
        {
            // Apply the optional scale to the incoming gradient first.
            if (dfScale != 1.0)
                scale_diff(dfScale);
            // dA = matmul(dC, B^T): A-input = this blob's diff (bADiff=true),
            // B-input = transposed copy of B's data, result into blobA's diff (bCDiff=true).
            blobWork.CopyFromAndTransposeHeightWidth(blobB, false);
            blobA.MatMul(this, blobWork, false, false, false, 1, true, false, true);
            // dB = matmul(A^T, dC): A-input = transposed copy of A's data,
            // B-input = this blob's diff (bBDiff=true), result into blobB's diff (bCDiff=true).
            blobWork.CopyFromAndTransposeHeightWidth(blobA, false);
            blobB.MatMul(blobWork, this, false, false, false, 1, false, true, true);
        }
3983
3992 public void Percentile(Blob<T> blobY, double dfPercentile)
3993 {
3994 List<int> rgShape = Utility.Clone<int>(shape());
3995 rgShape[0] = 1;
3996 blobY.Reshape(rgShape);
3997
3998 m_cuda.channel_percentile(m_nCount, num, channels, count(2), gpu_data, blobY.mutable_gpu_data, dfPercentile);
3999 }
4000 }
4001}
The Datum class is a simple wrapper to the SimpleDatum class to ensure compatibility with the origina...
Definition: Datum.cs:12
The ImageData class is a helper class used to convert between Datum, other raw data,...
Definition: ImageData.cs:14
static Datum GetImageData(Bitmap bmp, SimpleDatum sd, bool? bIsDataRealOverride=null, int[] rgFocusMap=null)
The GetImageData function converts a Bitmap into a Datum.
Definition: ImageData.cs:23
static Bitmap GetImage(SimpleDatum d, ColorMapper clrMap=null, List< int > rgClrOrder=null)
Converts a SimpleDatum (or Datum) into an image, optionally using a ColorMapper.
Definition: ImageData.cs:506
The ImageTools class is a helper class used to manipulate image data.
Definition: ImageTools.cs:16
static Bitmap ResizeImage(Image image, int width, int height)
Resize the image to the specified width and height.
Definition: ImageTools.cs:39
The LockBitmap class provides very efficient SetPixel and GetPixel functionality of a bitmap by using...
Definition: LockBitmap.cs:21
void SetPixel(int x, int y, Color color)
Set the color of the specified pixel
Definition: LockBitmap.cs:164
void UnlockBits()
Unlock bitmap data, releasing its underlying data.
Definition: LockBitmap.cs:99
void LockBits()
Lock bitmap data to access its underlying raw data.
Definition: LockBitmap.cs:55
The Log class provides general output in text form.
Definition: Log.cs:13
void CHECK(bool b, string str)
Test a flag for true.
Definition: Log.cs:227
void WriteLine(string str, bool bOverrideEnabled=false, bool bHeader=false, bool bError=false, bool bDisable=false)
Write a line of output.
Definition: Log.cs:80
void FAIL(string str)
Causes a failure which throws an exception with the descriptive text.
Definition: Log.cs:394
void CHECK_EQ(double df1, double df2, string str)
Test whether one number is equal to another.
Definition: Log.cs:239
void CHECK_LE(double df1, double df2, string str)
Test whether one number is less than or equal to another.
Definition: Log.cs:263
void CHECK_GE(double df1, double df2, string str)
Test whether one number is greater than or equal to another.
Definition: Log.cs:287
void CHECK_LT(double df1, double df2, string str)
Test whether one number is less than another.
Definition: Log.cs:275
The SimpleDatum class holds a data input within host memory.
Definition: SimpleDatum.cs:161
int Channels
Return the number of channels of the data.
int Width
Return the width of the data.
int Index
Returns the index of the SimpleDatum.
int Height
Return the height of the data.
The Utility class provides general utility functions.
Definition: Utility.cs:35
static int CanonicalAxisIndex(int nIdx, int nNumAxes)
Returns the 'canonical' version of a (usually) user-specified axis, allowing for negative indexing (e...
Definition: Utility.cs:50
static int Count(List< int > rgShape, int nStartIdx=0, int nEndIdx=-1)
Return the count of items given the shape.
Definition: Utility.cs:83
static double[] ConvertVec(float[] rgf)
Convert an array of float to an array of generics.
Definition: Utility.cs:550
The Blob is the main holder of data that moves through the Layers of the Net.
Definition: Blob.cs:25
Blob< T > MathDiv(T fScale)
Clones the input Blob and divides a scalar from all of the clones data items.
Definition: Blob.cs:2264
void Percentile(Blob< T > blobY, double dfPercentile)
Calculates the percentile and places the result in blobY.
Definition: Blob.cs:3992
int channels
DEPRECIATED; legacy shape accessor channels: use shape(1) instead.
Definition: Blob.cs:800
Blob(CudaDnn< T > cuda, Log log, List< int > rgShape, bool bIncludeDiff=true, bool bUseHalfSize=false)
The Blob constructor.
Definition: Blob.cs:115
double sum(float[] rgDf=null, bool bDiff=false)
Calculate the sum of the blob data.
Definition: Blob.cs:2986
void SetData(T[] rgData, int nCount=-1, bool bSetCount=true)
Sets a number of items within the Blob's data.
Definition: Blob.cs:1922
void ShareData(Blob< T > b)
Set the data to point to the data of the other blob – useful in Layers which simply perform a copy in...
Definition: Blob.cs:1813
double min_data
Returns the minimum value in the data of the Blob.
Definition: Blob.cs:2499
double max_data
Returns the maximum value in the data of the Blob.
Definition: Blob.cs:2525
int LegacyShape(int nIdx)
Returns the legacy shape at a given axis.
Definition: Blob.cs:825
void MatMul(Blob< T > blobA, Blob< T > blobB, bool bReshape=false, bool bTransA=false, bool bTransB=false, double dfScale=1.0, bool bADiff=false, bool bBDiff=false, bool bCDiff=false)
MatMul blobA with blobB and place the result in this blob (e.g. this = matmul(A, B))....
Definition: Blob.cs:3922
int height
DEPRECIATED; legacy shape accessor height: use shape(2) instead.
Definition: Blob.cs:808
Blob(CudaDnn< T > cuda, Log log, Blob< T > b, bool bUseHalfSize=false)
The Blob constructor.
Definition: Blob.cs:146
int count(int nStartIdx)
Compute the volume of a slice spanning from a particular first axis to the final axis.
Definition: Blob.cs:768
void MatMulGrad(Blob< T > blobA, Blob< T > blobB, Blob< T > blobWork, double dfScale=1.0)
Calculates and propagates the gradient for blobA and BlobB given the input gradient in this blob's di...
Definition: Blob.cs:3974
int count(int nStartIdx, int nEndIdx)
Compute the volume of a slice; i.e., the product of dimensions among a range of axes.
Definition: Blob.cs:751
Blob(CudaDnn< T > cuda, Log log, bool bIncludeDiff=true, bool bUseHalfSize=false)
The Blob constructor.
Definition: Blob.cs:64
int num_axes
Returns the number of axes in the Blob.
Definition: Blob.cs:705
Tuple< double, double, double, double > minmax_data(Blob< T > work, bool bDetectNans=false, bool bUseChunks=false)
Returns the minimum and maximum values in the data of the Blob.
Definition: Blob.cs:2624
double? GetParameter(string strName)
Get a blob parameter.
Definition: Blob.cs:220
long mutable_gpu_diff
Returns the diff GPU handle used by the CudaDnn connection.
Definition: Blob.cs:1555
void SaveToImage(string strFile, bool bNonZeroExistOnly=true, bool bSaveDiff=false, Dictionary< float, Color > rgSpecialValues=null)
Save the Blob to an image where values less than 0 are colored red, and values greater than 0 are col...
Definition: Blob.cs:3105
void scale_diff(T fScaleFactor)
Scale the blob diff by a constant factor.
Definition: Blob.cs:1791
Tuple< T, T, T > SetPixel(int nX, int nY, Tuple< T, T, T > pixel, bool bReturnOriginal=false, TransformationParameter.COLOR_ORDER order=TransformationParameter.COLOR_ORDER.RGB, int nOffset=0)
Sets a pixel to the values within a three item tuple where the first item is assigned RED,...
Definition: Blob.cs:3068
T[] mutable_cpu_diff
Get diff from the GPU and bring it over to the host, or Set diff from the Host and send it over to th...
Definition: Blob.cs:1511
T GetDiff(int nIdx)
Returns the diff at a given flat index within the Blob.
Definition: Blob.cs:1907
bool CompareShape(int[] rgShape, bool bCompareCpuDataLen=false)
Compares the shape of this blob to another shape.
Definition: Blob.cs:2148
T data_at(int n, int c, int h, int w)
Returns the data at a given location in the Blob.
Definition: Blob.cs:1394
T sumsq_diff()
Calculate the sum of squares (L2 norm squared) of the diff.
Definition: Blob.cs:1742
long mutable_gpu_data
Returns the data GPU handle used by the CudaDnn connection.
Definition: Blob.cs:1487
void SetDiff(double dfVal, int nStartIdx, int nCount)
Set a diff range with a given value.
Definition: Blob.cs:1998
void Share(Blob< T > b)
Share another Blob with this one, by setting the data and diff to the same data and diff of the other...
Definition: Blob.cs:1850
Blob(CudaDnn< T > cuda, Log log, int nNum, int nChannels, int nHeight, int nWidth, bool bIncludeDiff=true, bool bUseHalfSize=false)
DEPRECIATED; use
Definition: Blob.cs:98
object Tag
Returns a user defined object associated with the Blob.
Definition: Blob.cs:2770
void Unsqueeze(int nNumAxes)
Unsqueeze the shape by adding shape=1 on each axis until the 'nNumAxes' is reached.
Definition: Blob.cs:201
void CopyFromAndTransposeHeightWidth(Blob< T > blobSrc, bool bCopyDiff=false, bool bUseCuda=true)
Copy from a source Blob and transpose the height and width of the copy.
Definition: Blob.cs:1002
static Blob< T > Load(CudaDnn< T > cuda, Log log, BinaryReader br, bool bData, bool bDiff)
Loads a new Blob from a binary reader.
Definition: Blob.cs:2377
int num_true_axes
Returns the number of true axes, ignoring the trailing ones.
Definition: Blob.cs:716
bool HalfSize
Returns whether or not this blob is using half sizes.
Definition: Blob.cs:369
void Update()
The 'update' method is used for parameter blobs in a Net.
Definition: Blob.cs:1575
string shape_string
Returns a string describing the Blob's shape.
Definition: Blob.cs:657
static Blob< T > FromByteArray(CudaDnn< T > cuda, Log log, byte[] rg)
A new Blob is created from the byte array, previously saved with ToByteArray.
Definition: Blob.cs:2453
int offset(List< int > rgIdx)
Returns the flat offset given the array of axes values.
Definition: Blob.cs:873
void SetCPUData(T[] rg)
Sets just the CPU data to the data specified.
Definition: Blob.cs:2052
void Reshape(BlobShape shape, bool? bUseHalfSize=null)
Change the dimensions of the blob, allocating new memory if necessary.
Definition: Blob.cs:637
void CopyParameters(Blob< T > b)
Copy the parameters from another blob.
Definition: Blob.cs:245
T[] mutable_cpu_data
Get data from the GPU and bring it over to the host, or Set data from the Host and send it over to th...
Definition: Blob.cs:1461
static void SaveToNumpy(string strFile, long[] rgData, int[] rgShape)
Save a blob with data to a Numpy .npy file.
Definition: Blob.cs:3418
T asum_diff()
Compute the sum of absolute values (L1 norm) of the diff.
Definition: Blob.cs:1718
static Tuple< List< float[]>, int[], List< string > > LoadFromNumpy(string strFile, Log log=null, int nMax=int.MaxValue, int nStartIdx=0, int nCount=int.MaxValue)
Load the long, int, bool, float, or double data from a very large Numpy array .npy file,...
Definition: Blob.cs:3578
static T One
Returns One (1) in type T.
Definition: Blob.cs:268
Blob< T > Clone()
Copies the Blob, including its data and diff.
Definition: Blob.cs:2202
void ConvertToBase(long hWorkMem, ulong lWorkSize, bool bData, bool bDiff)
Converts this blob from the half type to the base type.
Definition: Blob.cs:339
bool DiffExists
Returns whether or not the Diff portion exists.
Definition: Blob.cs:676
SyncedMemory< T > diff
Returns the SyncedMemory that stores the diff.
Definition: Blob.cs:1444
void ConvertToHalf(long hWorkMem, ulong lWorkSize, bool bData, bool bDiff)
Converts this blob from its base type to the half type.
Definition: Blob.cs:306
void Reshape(List< int > rgShape, bool? bUseHalfSize=null)
Change the dimensions of the blob, allocating new memory if necessary.
Definition: Blob.cs:562
Blob(CudaDnn< T > cuda, Log log, SimpleDatum d, bool bCopyData=false, bool bIncludeDiff=true, bool bUseHalfSize=false)
The Blob constructor.
Definition: Blob.cs:163
int CanonicalAxisIndex(int nIdx)
Returns the 'canonical' version of a (usually) user-specified axis, allowing for negative indexing (e...
Definition: Blob.cs:780
Blob(CudaDnn< T > cuda, Log log, int[] rgShape, bool bIncludeDiff=true, bool bUseHalfSize=false)
The Blob constructor.
Definition: Blob.cs:131
T[] cpu_data
Returns the last host data retrieved from the GPU.
Definition: Blob.cs:1452
void SaveToNumpy(string strFile, bool bSaveDiff=false)
Save a blob with data to a Numpy .npy file.
Definition: Blob.cs:3259
void Reshape(int nNum, int nChannels, int nHeight, int nWidth, bool? bUseHalfSize=null)
DEPRECIATED; use
Definition: Blob.cs:442
BLOB_TYPE type
Returns the BLOB_TYPE of the Blob.
Definition: Blob.cs:2761
double GetMinData(out long lPos)
Returns the minimum data and the position where the minimum is located in the data.
Definition: Blob.cs:2512
double std(double? dfMean=null, float[] rgDf=null)
Calculate the standard deviation of the blob data.
Definition: Blob.cs:3007
Blob< T > MathSub(Blob< T > blobA)
Clones the input Blob and subtracts the data from this blob from it.
Definition: Blob.cs:2247
double GetMaxDiff(out long lPos)
Returns the maximum diff and the position where the maximum is located in the diff.
Definition: Blob.cs:2590
double min_diff
Returns the minimum value in the diff of the Blob.
Definition: Blob.cs:2551
Datum ToDatum()
Returns a new Datum that contains the shape and data of the Blob.
Definition: Blob.cs:2166
Tuple< double, double, double, double > minmax_diff(Blob< T > work, bool bDetectNans=false, bool bUseChunks=false)
Returns the minimum and maximum values in the diff of the Blob.
Definition: Blob.cs:2694
long CopyFrom(Blob< T > src, bool bCopyDiff=false, bool bReshape=false, long hDstHostBuffer=0, bool bIgnoreShape=false)
Copy from a source Blob.
Definition: Blob.cs:928
double mean(float[] rgDf=null, bool bDiff=false)
Calculate the mean of the blob data.
Definition: Blob.cs:2965
static void SaveToNumpy(string strFile, int[] rgData, int[] rgShape)
Save a blob with data to a Numpy .npy file.
Definition: Blob.cs:3367
bool CompareShape(List< int > rgShape, bool bCompareCpuDataLen=false)
Compares the shape of this blob to another shape.
Definition: Blob.cs:2108
void Dispose()
Releases all resources used by the Blob (including both GPU and Host).
Definition: Blob.cs:429
bool reshape_when_sharing
When true, this Blob is reshaped to the source when sharing the source data (default = false).
Definition: Blob.cs:1803
byte[] ToByteArray()
Saves this Blob to a byte array.
Definition: Blob.cs:2436
int shape(int nIdx)
Returns the dimension of the nIdx'th axis (or the negative nIdx'th axis from the end,...
Definition: Blob.cs:696
Blob< T > MathAdd(Blob< T > blobA, T fScale)
Clones the input Blob, scales the clone and then adds the data from this Blob to it.
Definition: Blob.cs:2227
bool Compare(Blob< T > other, Blob< T > work, bool bDiff=false, double dfTol=1e-8, bool bZeroCheck=true, bool bFullCompare=false, bool bDetectNans=true, bool bForceOtherData=false)
Compare the data (or diff) of one blob to another and return true if all items fall within the specif...
Definition: Blob.cs:1093
void CopyFrom(Blob< T > src, int nSrcOffset, int nDstOffset, int nCount, bool bCopyData, bool bCopyDiff)
Copy from a source Blob.
Definition: Blob.cs:903
void scale_to_range(double dfMin, double dfMax)
Scale the data in the blob to the range [dfMin,dfMax].
Definition: Blob.cs:1773
bool ShapeEquals(BlobProto bp)
Compares the shape of this blob to the shape within a BlobProto.
Definition: Blob.cs:2079
T[] update_cpu_diff()
Update the CPU diff by transferring the GPU diff over to the Host.
Definition: Blob.cs:1529
void scale_data(double df)
Scale the data by a scaling factor.
Definition: Blob.cs:1754
int width
DEPRECATED; legacy shape accessor width: use shape(3) instead.
Definition: Blob.cs:816
void FromProto(BlobProto bp, bool bReshape=true)
Create a new Blob from a given BlobProto.
Definition: Blob.cs:1589
T diff_at(List< int > rgIdx)
Returns the diff at a given location in the Blob.
Definition: Blob.cs:1427
double GetMinDiff(out long lPos)
Returns the minimum diff and the position where the minimum is located in the diff.
Definition: Blob.cs:2564
long gpu_shape
Returns the shape GPU handle used by the CudaDnn connection. The shape data contains the shape inform...
Definition: Blob.cs:1565
void add_scalar(double dfVal)
Adds a scalar value to the Blob.
Definition: Blob.cs:2779
void SetParameter(string strName, double dfVal)
Set a blob parameter.
Definition: Blob.cs:233
Tuple< T, T, T > SetPixel(int nX, int nY, byte R, byte G, byte B, TransformationParameter.COLOR_ORDER order=TransformationParameter.COLOR_ORDER.RGB)
Set the values of a 3 channel image embedded within the blob in the order RGB or BGR where the full h...
Definition: Blob.cs:3035
BlobProto ToProto(bool bWriteDiff=false)
Writes the Blob to a new BlobProto.
Definition: Blob.cs:1663
Blob(Blob< T > blob, long lCount, long lOffset)
The Blob constructor used to copy another blob by creating memory pointers to its data thus sharing t...
Definition: Blob.cs:188
void Reshape(int[] rgShape, bool? bUseHalfSize=null)
Change the dimensions of the blob, allocating new memory if necessary.
Definition: Blob.cs:583
Tuple< float[], int[]> LoadFromNumpy(string strFile, bool bLoadDiff=false, bool bLoadDataOnly=false, Log log=null, int nMax=int.MaxValue)
Load a blob with data from a Numpy array .npy file.
Definition: Blob.cs:3473
void AsyncGpuPush(long hStream)
Asynchronously pushes the CPU data, previously set with SetCPUData, to the GPU.
Definition: Blob.cs:2062
ulong GetConversionWorkSize(bool bUseHalfSize)
Returns the amount of memory (in bytes) required to convert from base to half and back.
Definition: Blob.cs:293
bool freeze_learning
Specifies whether or not the diff is applied to the data during Update. When freeze learning = true,...
Definition: Blob.cs:377
double max_diff
Returns the maximum value in the diff of the Blob.
Definition: Blob.cs:2577
List< int > shape()
Returns an array where each element contains the shape of an axis of the Blob.
Definition: Blob.cs:684
static T Zero
Returns Zero (0) in type T.
Definition: Blob.cs:260
T GetData(int nIdx)
Returns the data at a given flat index within the Blob.
Definition: Blob.cs:1893
SyncedMemory< T > data
Returns the SyncedMemory that stores the data.
Definition: Blob.cs:1436
T sumsq_data()
Calculate the sum of squares (L2 norm squared) of the data.
Definition: Blob.cs:1730
bool CompareEx(Blob< T > other, Blob< T > work, out double dfMin, out double dfMax, bool bDiff=false, double dfTol=1e-8, bool bZeroCheck=true, bool bFullCompare=false, bool bDetectNans=true, bool bForceOtherData=false)
Compare the data (or diff) of one blob to another and return true if all items fall within the specif...
Definition: Blob.cs:1114
static void SaveToNumpy(string strFile, float[] rgData, int[] rgShape)
Save a blob with data to a Numpy .npy file.
Definition: Blob.cs:3316
T[] update_cpu_data()
Update the CPU data by transferring the GPU data over to the Host.
Definition: Blob.cs:1470
override string ToString()
Returns a string representation of the Blob.
Definition: Blob.cs:2466
void Save(BinaryWriter bw, bool bData, bool bDiff, bool bIncludeName=true)
Saves this Blob to a binary stream.
Definition: Blob.cs:2298
T asum_data()
Compute the sum of absolute values (L1 norm) of the data.
Definition: Blob.cs:1706
const int MAX_BLOB_AXES
Defines the maximum number of Axes supported by the Blob.
Definition: Blob.cs:55
void NormalizeData(double? dfMean=null, double? dfStd=null)
Normalize the blob data by subtracting the mean and dividing by the standard deviation.
Definition: Blob.cs:2942
void scale_data(T fScaleFactor)
Scale the blob data by a constant factor.
Definition: Blob.cs:1782
static Blob< T > LoadBinary(CudaDnn< T > cuda, Log log, string strFile, bool bData, bool bDiff)
Loads a blob from a binary file (previously saved with SaveBinary).
Definition: Blob.cs:2359
int count()
Returns the total number of items in the Blob.
Definition: Blob.cs:739
void ShareDiff(Blob< T > b)
Set the diff to point to the diff of the other blob – useful in Layers which simply perform a copy in...
Definition: Blob.cs:1832
void SetData(SimpleDatum d, bool bReshape, bool bCopyData=true)
Sets the Blob values to the data contained within a SimpleDatum.
Definition: Blob.cs:2029
void CopyFromAndPad(Blob< T > src, double dfPad=0, bool bCopyDiff=false)
Copy the source data to this Blob, and if this blob is larger than the source, pad this blob with 'df...
Definition: Blob.cs:973
void ReshapeLike(Blob< T > b, bool? bUseHalfSize=null)
Reshape this Blob to have the same shape as another Blob.
Definition: Blob.cs:648
bool Compare(CudaDnn< double > cuda, Blob< T > other, Blob< double > work, bool bDiff=false, double dfTol=1e-8)
Compare the data (or diff) of one blob to another and return true if all items fall within the specif...
Definition: Blob.cs:1220
T diff_at(int n, int c, int h, int w)
Returns the diff at a given location in the Blob.
Definition: Blob.cs:1407
string Name
Get/set the name of the Blob.
Definition: Blob.cs:2184
int offset(int n, int c=0, int h=0, int w=0)
Returns the flat offset given the number, channel, height and width.
Definition: Blob.cs:850
CudaDnn< T > Cuda
Returns the CudaDnn object that manages the Blob's memory.
Definition: Blob.cs:386
long gpu_diff
Returns the diff GPU handle used by the CudaDnn connection.
Definition: Blob.cs:1541
virtual void Dispose(bool bDisposing)
Releases all resources used by the Blob (including both GPU and Host).
Definition: Blob.cs:402
T data_at(List< int > rgIdx)
Returns the data at a given location in the Blob.
Definition: Blob.cs:1417
void SetData(double dfVal, int nStartIdx, int nCount)
Set a data range with a given value.
Definition: Blob.cs:1961
string ToSizeString()
Returns a string describing the 4D shape of the Blob.
Definition: Blob.cs:2157
void SaveBinary(string strFile, bool bData, bool bDiff, bool bIncludeName=true)
Saves the blob to a binary file.
Definition: Blob.cs:2282
string ToString(int nMax, bool bDiff=false)
Get the string representation containing up to the first 'nMax' items.
Definition: Blob.cs:2478
void SetDiff(T[] rgDiff, int nCount=-1, bool bSetCount=true)
Sets a number of items within the Blob's diff.
Definition: Blob.cs:2018
Blob(CudaDnn< T > cuda, Log log, BlobProto bp, bool bUseHalfSize=false)
The Blob constructor.
Definition: Blob.cs:176
void scale_diff(double df)
Scale the diff by a scaling factor.
Definition: Blob.cs:1763
bool Padded
Get/set the padding state of the blob.
Definition: Blob.cs:284
void SetDiff(double dfVal, int nIdx=-1)
Either sets all of the diff items in the Blob to a given value, or alternatively only sets a single i...
Definition: Blob.cs:1981
void CopyFrom(Blob< T > blobSrc, int nChannelFrom, int nChannelTo, bool bCopyDiff=false)
Copy all data along a given channel from the source.
Definition: Blob.cs:1054
int num
DEPRECATED; legacy shape accessor num: use shape(0) instead.
Definition: Blob.cs:792
T[] cpu_diff
Returns the last host diff retrieved from the GPU.
Definition: Blob.cs:1496
static T MinusOne
Returns MinusOne (-1) in type T.
Definition: Blob.cs:276
void SetData(T fVal, int nIdx=-1)
Either sets all of the data items in the Blob to a given value, or alternatively only sets a single i...
Definition: Blob.cs:1933
bool ValidateData(Blob< T > work, bool bDiff=false)
Validate the data or diff looking for NAN or Inf.
Definition: Blob.cs:1197
bool snapshot_requested
Get/set the snapshot request.
Definition: Blob.cs:1883
Blob< T > Resize(List< int > rgShape)
The Resize method resizes the 3rd and 4th axes of the blob.
Definition: Blob.cs:2852
long gpu_data
Returns the data GPU handle used by the CudaDnn connection.
Definition: Blob.cs:1479
void SetData(double dfVal, int nIdx=-1)
Either sets all of the data items in the Blob to a given value, or alternatively only sets a single i...
Definition: Blob.cs:1947
double GetMaxData(out long lPos)
Returns the maximum data and the position where the maximum is located in the data.
Definition: Blob.cs:2538
The CudaDnn object is the main interface to the Low-Level Cuda C++ DLL.
Definition: CudaDnn.cs:969
void matmul(uint nOuterCount, int m, int n, int k, long hA, long hB, long hC, double dfScale=1.0, bool bTransA=false, bool bTransB=false)
Perform matmul operation hC = matmul(hA, hB), where hA, hB and hC are all in row-major format.
Definition: CudaDnn.cs:6695
void copy(int nCount, long hSrc, long hDst, int nSrcOffset=0, int nDstOffset=0, long hStream=-1, bool? bSrcHalfSizeOverride=null, bool? bDstHalfSizeOverride=null)
Copy data from one block of GPU memory to another.
Definition: CudaDnn.cs:6007
void mul_scalar(int n, double fAlpha, long hY)
Multiply each element of Y by a scalar.
Definition: CudaDnn.cs:7374
void scal(int n, double fAlpha, long hX, int nXOff=0)
Scales the data in X by a scaling factor.
Definition: CudaDnn.cs:6767
void max(int n, long hA, long hB, long hY)
Calculates the max of A and B and places the result in Y. This max is only computed on a per item bas...
Definition: CudaDnn.cs:7669
void FreeMemory(long hMem)
Free previously allocated GPU memory.
Definition: CudaDnn.cs:2517
void add_scalar(int n, double fAlpha, long hY)
Adds a scalar value to each element of Y.
Definition: CudaDnn.cs:7161
void scale_to_range(int n, long hX, long hY, double fMin, double fMax)
Scales the values in X and places the result in Y (can also run inline where X = Y).
Definition: CudaDnn.cs:6973
long AllocMemory(List< double > rg)
Allocate a block of GPU memory and copy a list of doubles to it.
Definition: CudaDnn.cs:2291
void sub(int n, long hA, long hB, long hY, int nAOff=0, int nBOff=0, int nYOff=0, int nB=0)
Subtracts B from A and places the result in Y.
Definition: CudaDnn.cs:7312
T[] SetPixel(long hMem, int nCount, bool bReturnOriginal, int nOffset, params Tuple< int, T >[] rgPixel)
Set a pixel value where each pixel is defined a set index, value tuple.
Definition: CudaDnn.cs:2933
void add(int n, long hA, long hB, long hC, long hY)
Adds A, B and C and places the result in Y.
Definition: CudaDnn.cs:7209
static ulong basetype_size(bool bUseHalfSize)
Returns the base type size in bytes.
Definition: CudaDnn.cs:1899
void axpy(int n, double fAlpha, long hX, long hY)
Multiply the vector X by a scalar and add the result to the vector Y.
Definition: CudaDnn.cs:6544
void transposeHW(int n, int c, int h, int w, long hSrc, long hDst)
Transpose a n*c number of matrices along the height and width dimensions. All matrices are in row-maj...
Definition: CudaDnn.cs:6716
Tuple< double, double, double, double > minmax(int n, long hA, long hWork1, long hWork2, bool bDetectNans=false, int nAOff=0)
Finds the minimum and maximum values within A.
Definition: CudaDnn.cs:7818
double[] GetMemoryDouble(long hMem, long lCount=-1)
Retrieves the GPU memory as an array of doubles.
Definition: CudaDnn.cs:2677
void channel_percentile(int nCount, int nOuterNum, int nChannels, int nInnerNum, long hX, long hY, double dfPercentile)
Calculates the percentile along axis = 0.
Definition: CudaDnn.cs:8361
void set(int nCount, long hHandle, double fVal, int nIdx=-1)
Set the values of GPU memory to a specified value of type
Definition: CudaDnn.cs:5897
double asum_double(int n, long hX, int nXOff=0)
Computes the sum of absolute values in X.
Definition: CudaDnn.cs:6871
T asum(int n, long hX, int nXOff=0)
Computes the sum of absolute values in X.
Definition: CudaDnn.cs:6901
void min(int n, long hA, long hB, long hY)
Calculates the min of A and B and places the result in Y. This min is only computed on a per item bas...
Definition: CudaDnn.cs:7702
T[] get(int nCount, long hHandle, int nIdx=-1)
Queries the GPU memory by copying it into an array of type 'T'.
Definition: CudaDnn.cs:5985
float[] GetMemoryFloat(long hMem, long lCount=-1)
Retrieves the GPU memory as an array of float.
Definition: CudaDnn.cs:2689
T dot(int n, long hX, long hY, int nXOff=0, int nYOff=0)
Computes the dot product of X and Y.
Definition: CudaDnn.cs:6847
The SyncedMemory manages the low-level connection between the GPU and host memory.
Definition: SyncedMemory.cs:18
bool HalfSize
Returns whether or not the sync memory is half-sized memory.
void async_gpu_push(long hStream, T[] rg)
Pushes the host data, previously set with set_cpu_data_locally(), to the GPU.
long gpu_data
Returns the handle to the GPU memory.
object Tag
Get/set data associated with the synced memory.
void set_gpu_data(long hData, long lCount, long lOffset)
Copies a new Memory Pointer within the low-level CudaDnnDLL where a Memory Pointer uses another alrea...
T[] mutable_cpu_data
Get/set the mutable host data.
long Copy(SyncedMemory< T > src, long hDstHostBuffer=0)
Copy another SyncedMemory into this one.
void Dispose()
Releases all GPU and host resources used.
Definition: SyncedMemory.cs:77
void SetData(T[] rgData, int nCount, bool bSetCount=true)
Sets the array of host data on the GPU and re-allocates the GPU memory if needed.
void Allocate(long lCount, bool bUseHalfSize=false)
Allocate a number of items in GPU memory and save the handle.
Definition: SyncedMemory.cs:92
long Capacity
Returns the total amount of GPU memory held by this SyncedMemory.
T GetAt(int nIdx)
Return a value at a given index.
long mutable_gpu_data
Returns the mutable handle to GPU data.
T[] update_cpu_data(long lCount=-1)
Updates the host data by copying the GPU data to the host data.
T[] cpu_data
Returns the data on the CPU that has already been transferred from GPU to CPU.
void ZeroAll()
Set all items in the GPU memory up to the Capacity, to zero.
void set_cpu_data_locally(T[] rg)
This does not place the data on the GPU - call async_gpu_push() to move it to the GPU.
long Count
Returns the current count of items in this SyncedMemory. Note, the Count may be less than the Capacit...
The BlobProto contains the description of a blob.
Definition: BlobProto.cs:15
List< float > data
Get/set the data as a List of float.
Definition: BlobProto.cs:180
List< double > double_diff
Get/set the diff as a List of double.
Definition: BlobProto.cs:171
BlobShape shape
Specifies the shape of the Blob.
Definition: BlobProto.cs:117
List< double > double_data
Get/set the data as a List of double.
Definition: BlobProto.cs:162
int? num
Specifies the number of inputs (such as images) in the Blob.
Definition: BlobProto.cs:126
List< float > diff
Get/set the diff as a List of float.
Definition: BlobProto.cs:189
int? height
Specifies the height of each input.
Definition: BlobProto.cs:144
int? channels
Specifies the number of images per input.
Definition: BlobProto.cs:135
int? width
Specifies the width of each input.
Definition: BlobProto.cs:153
Specifies the shape of a Blob.
Definition: BlobShape.cs:15
List< int > dim
The blob shape dimensions.
Definition: BlobShape.cs:93
Stores parameters used to apply transformation to the data layer's data.
COLOR_ORDER
Defines the color ordering used to transform the input data.
The MyCaffe.basecode contains all generic types used throughout MyCaffe.
Definition: Annotation.cs:12
The MyCaffe.common namespace contains common MyCaffe classes.
Definition: BatchInput.cs:8
BLOB_TYPE
Defines the type of data held by a given Blob.
Definition: Interfaces.cs:62
The MyCaffe.param namespace contains parameters used to create models.
The MyCaffe namespace contains the main body of MyCaffe code that closely tracks the C++ Caffe open-...
Definition: Annotation.cs:12