MyCaffe  1.12.2.41
Deep learning software for Windows C# programmers.
SyncedMemory.cs
1using System;
2using System.Collections.Generic;
3using System.Linq;
4using System.Text;
5using MyCaffe.basecode;
6
7namespace MyCaffe.common
8{
17 public class SyncedMemory<T> : IDisposable
18 {
        Log m_log;                      // Output log (may be null; see constructor).
        CudaDnn<T> m_cuda;              // Low-level Cuda connection used for all GPU operations.
        int m_nDeviceID = -1;           // Device on which the GPU memory was allocated (-1 = none).
        long m_lCapacity = 0;           // Total allocated GPU capacity, in items.
        long m_lCount = 0;              // Current number of valid items (<= m_lCapacity).
        long m_hGpuData = 0;            // Handle to the GPU memory (0 = not allocated).
        T[] m_rgCpuData = null;         // Host-side copy of the data, filled by update_cpu_data().
        bool m_bOwnData = true;         // True when we own m_hGpuData; false when it is a memory pointer.
        bool m_bHalfSize = false;       // True when using half-sized memory (float base type only).
        object m_tag = null;            // User data associated with this instance.
29
38 public SyncedMemory(CudaDnn<T> cuda, Log log, long lCapacity = 0, object tag = null, bool bUseHalfSize = false)
39 {
40 if (bUseHalfSize && typeof(T) != typeof(float))
41 {
42 bUseHalfSize = false;
43
44 if (log != null)
45 log.WriteLine("Half size disabled for non 'float' basetypes!");
46 }
47
48 m_bHalfSize = bUseHalfSize;
49 m_cuda = cuda;
50 m_log = log;
51 m_tag = tag;
52
53 if (lCapacity > 0)
54 {
55 m_nDeviceID = m_cuda.GetDeviceID();
56 m_hGpuData = m_cuda.AllocMemory(lCapacity);
57 m_lCapacity = lCapacity;
58 m_lCount = lCapacity;
59 }
60 }
61
62 private void free()
63 {
64 if (m_hGpuData != 0)
65 {
66 check_device();
67 if (m_bOwnData)
68 m_cuda.FreeMemory(m_hGpuData);
69 else
70 m_cuda.FreeMemoryPointer(m_hGpuData);
71 }
72 }
73
77 public void Dispose()
78 {
79 free();
80 m_hGpuData = 0;
81 m_nDeviceID = -1;
82 m_lCapacity = 0;
83 m_lCount = 0;
84 m_rgCpuData = null;
85 }
86
92 public void Allocate(long lCount, bool bUseHalfSize = false)
93 {
94 if (bUseHalfSize && typeof(T) != typeof(float))
95 {
96 bUseHalfSize = false;
97
98 if (m_log != null)
99 m_log.WriteLine("Half size disabled for non 'float' basetypes!");
100 }
101
102 free();
103 m_nDeviceID = m_cuda.GetDeviceID();
104 m_bHalfSize = bUseHalfSize;
105 m_hGpuData = m_cuda.AllocMemory(lCount, m_bHalfSize);
106 m_lCapacity = lCount;
107 m_lCount = 0;
108 m_bOwnData = true;
109 return;
110 }
111
117 public void Allocate(T[] rg, bool bUseHalfSize = false)
118 {
119 if (bUseHalfSize && typeof(T) != typeof(float))
120 {
121 bUseHalfSize = false;
122
123 if (m_log != null)
124 m_log.WriteLine("Half size disabled for non 'float' basetypes!");
125 }
126
127 free();
128 m_nDeviceID = m_cuda.GetDeviceID();
129 m_bHalfSize = bUseHalfSize;
130 m_hGpuData = m_cuda.AllocMemory(rg, 0, m_bHalfSize);
131 m_lCapacity = rg.Length;
132 m_lCount = rg.Length;
133 m_bOwnData = true;
134 check_device();
135
136 return;
137 }
138
142 public void Zero()
143 {
144 if (m_lCount > 0)
145 {
146 check_device();
147 m_cuda.set((int)m_lCount, m_hGpuData, 0.0);
148 }
149 }
150
154 public void ZeroAll()
155 {
156 if (m_lCapacity > 0)
157 {
158 check_device();
159 m_cuda.set((int)m_lCapacity, m_hGpuData, 0.0);
160 }
161 }
162
167 public void Set(double dfVal)
168 {
169 if (m_lCount > 0)
170 {
171 check_device();
172 m_cuda.set((int)m_lCount, m_hGpuData, dfVal);
173 }
174 }
175
        /// <summary>
        /// Set a specific item at a given index to a value.
        /// </summary>
        /// <param name="nIdx">Specifies the index of the item to set.</param>
        /// <param name="fVal">Specifies the value to set.</param>
        public void SetAt(int nIdx, T fVal)
        {
            check_device();
            // NOTE(review): nIdx is not range-checked here — presumably validated by
            // the low-level set(); confirm against CudaDnn.set().
            m_cuda.set((int)m_lCount, m_hGpuData, fVal, nIdx);
        }
186
192 public T GetAt(int nIdx)
193 {
194 check_device();
195 T[] rg = m_cuda.get((int)m_lCount, m_hGpuData, nIdx);
196 return rg[0];
197 }
198
        /// <summary>
        /// Copy another SyncedMemory into this one, re-allocating this memory if needed.
        /// </summary>
        /// <param name="src">Specifies the source SyncedMemory (when null, this Count is set to 0 and nothing is copied).</param>
        /// <param name="hDstHostBuffer">Optionally, specifies a host buffer handle used to stage copies across kernels; pass the returned handle back in on later calls to reuse it.</param>
        /// <returns>The host buffer handle used (unchanged, newly allocated, or 0 when none was needed) is returned.</returns>
        public long Copy(SyncedMemory<T> src, long hDstHostBuffer = 0)
        {
            // A null source just empties this memory (capacity is retained).
            if (src == null)
            {
                m_lCount = 0;
                return hDstHostBuffer;
            }

            // Grow the GPU allocation when the source holds more items than we can store.
            if (m_lCapacity < src.m_lCount)
                Allocate(src.m_lCount);

            m_lCount = src.m_lCount;

            if (m_lCount > 0)
            {
                if (m_cuda.KernelHandle == src.m_cuda.KernelHandle)
                {
                    // Same low-level kernel: a direct device-to-device copy suffices.
                    check_device();
                    m_cuda.copy((int)m_lCount, src.m_hGpuData, m_hGpuData);
                }
                else
                {
                    // Different kernels: stage the copy through a host buffer,
                    // allocating one (or growing the caller's) when too small.
                    if (hDstHostBuffer == 0)
                    {
                        hDstHostBuffer = m_cuda.AllocHostBuffer(m_lCount);
                    }
                    else
                    {
                        long lCount = m_cuda.GetHostBufferCapacity(hDstHostBuffer);
                        if (lCount < m_lCount)
                        {
                            m_cuda.FreeHostBuffer(hDstHostBuffer);
                            hDstHostBuffer = m_cuda.AllocHostBuffer(m_lCount);
                        }
                    }

                    src.m_cuda.KernelCopy((int)m_lCount, src.m_hGpuData, 0, m_cuda.KernelHandle, m_hGpuData, 0, hDstHostBuffer, m_cuda.KernelHandle);
                }
            }

            return hDstHostBuffer;
        }
247
253 {
254 SyncedMemory<T> dst = new SyncedMemory<T>(m_cuda, m_log, m_lCapacity, null, m_bHalfSize);
255
256 if (m_lCount > 0)
257 dst.Copy(this);
258
259 return dst;
260 }
261
        /// <summary>
        /// Returns whether or not the sync memory is half-sized memory.
        /// </summary>
        public bool HalfSize
        {
            get { return m_bHalfSize; }
        }

        /// <summary>
        /// Get/set data associated with the synced memory.
        /// </summary>
        public object Tag
        {
            get { return m_tag; }
            set { m_tag = value; }
        }

        /// <summary>
        /// Returns the Device ID on which the GPU memory of this SyncedMemory was allocated.
        /// </summary>
        public int DeviceID
        {
            get { return m_nDeviceID; }
        }

        /// <summary>
        /// Returns the total amount of GPU memory (in items) held by this SyncedMemory.
        /// </summary>
        public long Capacity
        {
            get { return m_lCapacity; }
        }

        /// <summary>
        /// Get/set the current count of items in this SyncedMemory.  Note, the Count may be less than the Capacity.
        /// </summary>
        public long Count
        {
            get { return m_lCount; }
            set { m_lCount= value; }
        }

        /// <summary>
        /// Returns the handle to the GPU memory.
        /// </summary>
        public long gpu_data
        {
            get { return m_hGpuData; }
        }
311
        /// <summary>
        /// Creates a new Memory Pointer within the low-level CudaDnnDLL that uses an
        /// already allocated block of GPU memory, and uses it as this instance's data.
        /// </summary>
        /// <param name="hData">Specifies the handle to the existing GPU memory.</param>
        /// <param name="lCount">Specifies the number of items the pointer covers.</param>
        /// <param name="lOffset">Specifies the offset (in items) into the existing memory.</param>
        public void set_gpu_data(long hData, long lCount, long lOffset)
        {
            free();
            m_hGpuData = m_cuda.CreateMemoryPointer(hData, lOffset, lCount);
            m_lCapacity = lCount;
            m_lCount = lCount;
            m_bOwnData = false;     // Borrowed memory: freed via FreeMemoryPointer, not FreeMemory.
            check_device();
        }
328
336 {
337 get
338 {
339 check_device();
340 return m_hGpuData;
341 }
342// set { m_hGpuData = value; }
343 }
344
        /// <summary>
        /// Returns the data on the CPU that has already been transferred from GPU to CPU
        /// (via update_cpu_data(); may be null if never transferred).
        /// </summary>
        public T[] cpu_data
        {
            get { return m_rgCpuData; }
        }
352
359 public void SetData(T[] rgData, int nCount, bool bSetCount = true)
360 {
361 if (nCount == -1)
362 nCount = rgData.Length;
363
364 if (nCount > m_lCapacity || m_hGpuData == 0)
365 {
366 bSetCount = true;
367 Allocate(nCount);
368 }
369
370 m_cuda.SetMemory(m_hGpuData, rgData, 0, nCount);
371
372 if (bSetCount)
373 m_lCount = nCount;
374
375 check_device();
376 }
377
386 {
387 get { return update_cpu_data(); }
388 set
389 {
390 check_device();
391 if (value.Length > m_lCapacity || m_hGpuData == 0)
392 {
393 Allocate(value);
394 }
395 else
396 {
397 m_cuda.SetMemory(m_hGpuData, value);
398 m_lCount = value.Length;
399 check_device();
400 }
401 }
402 }
403
409 public T[] update_cpu_data(long lCount = -1)
410 {
411 if (lCount >= 0)
412 {
413 if (lCount > m_lCapacity)
414 throw new ArgumentOutOfRangeException();
415
416 m_lCount = lCount;
417 }
418
419 check_device();
420
421 if (m_lCount == 0)
422 m_rgCpuData = new List<T>().ToArray();
423 else
424 m_rgCpuData = m_cuda.GetMemory(m_hGpuData, m_lCount);
425
426 return m_rgCpuData;
427 }
428
        /// <summary>
        /// Sets the host data locally only.  This does not place the data on the GPU -
        /// call async_gpu_push() to move it to the GPU.
        /// </summary>
        /// <param name="rg">Specifies the host data to hold.</param>
        public void set_cpu_data_locally(T[] rg)
        {
            m_rgCpuData = rg;
        }
437
446 public void async_gpu_push(long hStream, T[] rg)
447 {
448 check_device();
449 if (m_hGpuData == 0)
450 {
451 m_hGpuData = m_cuda.AllocMemory(rg, hStream);
452 m_lCapacity = rg.Length;
453 }
454 else
455 {
456 m_cuda.SetMemory(m_hGpuData, rg, hStream);
457 }
458
459 m_lCount = rg.Length;
460 check_device();
461 }
462
463 private void check_device()
464 {
465#if DEBUG
466 if (m_lCount > 0)
467 {
468 int nDeviceId = m_cuda.GetDeviceID();
469 m_log.CHECK_EQ(nDeviceId, m_nDeviceID, "The current device DOES'NT match the device for which the memory was allocated!");
470 }
471#endif
472 }
473 }
474}
The Log class provides general output in text form.
Definition: Log.cs:13
void WriteLine(string str, bool bOverrideEnabled=false, bool bHeader=false, bool bError=false, bool bDisable=false)
Write a line of output.
Definition: Log.cs:80
The CudaDnn object is the main interface to the Low-Level Cuda C++ DLL.
Definition: CudaDnn.cs:969
T[] GetMemory(long hMem, long lCount=-1)
Retrieves the GPU memory as an array of type 'T'
Definition: CudaDnn.cs:2700
int GetDeviceID()
Returns the current device id set within Cuda.
Definition: CudaDnn.cs:2013
void copy(int nCount, long hSrc, long hDst, int nSrcOffset=0, int nDstOffset=0, long hStream=-1, bool? bSrcHalfSizeOverride=null, bool? bDstHalfSizeOverride=null)
Copy data from one block of GPU memory to another.
Definition: CudaDnn.cs:6007
void FreeMemory(long hMem)
Free previously allocated GPU memory.
Definition: CudaDnn.cs:2517
long CreateMemoryPointer(long hData, long lOffset, long lCount)
Creates a memory pointer into an already existing block of GPU memory.
Definition: CudaDnn.cs:3028
void SetMemory(long hMem, List< double > rg)
Copies a list of doubles into a block of already allocated GPU memory.
Definition: CudaDnn.cs:2734
long AllocMemory(List< double > rg)
Allocate a block of GPU memory and copy a list of doubles to it.
Definition: CudaDnn.cs:2291
long AllocHostBuffer(long lCapacity)
Allocate a block of host memory with a specified capacity.
Definition: CudaDnn.cs:2581
long GetHostBufferCapacity(long hMem)
Returns the host memory capacity.
Definition: CudaDnn.cs:2621
void FreeHostBuffer(long hMem)
Free previously allocated host memory.
Definition: CudaDnn.cs:2602
void set(int nCount, long hHandle, double fVal, int nIdx=-1)
Set the values of GPU memory to a specified value of type
Definition: CudaDnn.cs:5897
long KernelHandle
Returns the Low-Level kernel handle used for this instance. Each Low-Level kernel maintains its own s...
Definition: CudaDnn.cs:1812
void FreeMemoryPointer(long hData)
Frees a memory pointer.
Definition: CudaDnn.cs:3046
T[] get(int nCount, long hHandle, int nIdx=-1)
Queries the GPU memory by copying it into an array of type 'T'.
Definition: CudaDnn.cs:5985
The SyncedMemory manages the low-level connection between the GPU and host memory.
Definition: SyncedMemory.cs:18
bool HalfSize
Returns whether or not the sync memory is half-sized memory.
void Allocate(T[] rg, bool bUseHalfSize=false)
Allocate a number of items and copy the given array into the memory on the GPU.
void Zero()
Set all items in the GPU memory up to the Count, to zero.
void Set(double dfVal)
Set all items up to Count to a given value.
void async_gpu_push(long hStream, T[] rg)
Pushes the host data, previously set with set_cpu_data_locally(), to the GPU.
long gpu_data
Returns the handle to the GPU memory.
object Tag
Get/set data associated with the synced memory.
void set_gpu_data(long hData, long lCount, long lOffset)
Copies a new Memory Pointer within the low-level CudaDnnDLL where a Memory Pointer uses another alrea...
T[] mutable_cpu_data
Get/set the mutable host data.
long Copy(SyncedMemory< T > src, long hDstHostBuffer=0)
Copy another SyncedMemory into this one.
void Dispose()
Releases all GPU and host resources used.
Definition: SyncedMemory.cs:77
SyncedMemory(CudaDnn< T > cuda, Log log, long lCapacity=0, object tag=null, bool bUseHalfSize=false)
The SyncedMemory constructor.
Definition: SyncedMemory.cs:38
void SetData(T[] rgData, int nCount, bool bSetCount=true)
Sets the array of host data on the GPU and re-allocates the GPU memory if needed.
void Allocate(long lCount, bool bUseHalfSize=false)
Allocate a number of items in GPU memory and save the handle.
Definition: SyncedMemory.cs:92
long Capacity
Returns the total amount of GPU memory held by this SyncedMemory.
SyncedMemory< T > Clone()
Copy this SyncedMemory.
T GetAt(int nIdx)
Return a value at a given index.
long mutable_gpu_data
Returns the mutable handle to GPU data.
T[] update_cpu_data(long lCount=-1)
Updates the host data by copying the GPU data to the host data.
T[] cpu_data
Returns the data on the CPU that has already been transferred from GPU to CPU.
void SetAt(int nIdx, T fVal)
Set a specific item at a given index to a value.
void ZeroAll()
Set all items in the GPU memory up to the Capacity, to zero.
void set_cpu_data_locally(T[] rg)
This does not place the data on the GPU - call async_gpu_push() to move it to the GPU.
int DeviceID
Returns the Device ID on which the GPU memory of this SyncedMemory was allocated.
long Count
Returns the current count of items in this SyncedMemory. Note, the Count may be less than the Capacit...
The MyCaffe.basecode contains all generic types used throughout MyCaffe.
Definition: Annotation.cs:12
The MyCaffe.common namespace contains common MyCaffe classes.
Definition: BatchInput.cs:8
The MyCaffe namespace contains the main body of MyCaffe code that closely tracks the C++ Caffe open-...
Definition: Annotation.cs:12