MyCaffe  1.12.2.41
Deep learning software for Windows C# programmers.
CfcUnitLayer.cs
using System;
using System.Collections.Concurrent;
using System.Collections.Generic;
using System.Diagnostics;
using System.Linq;
using System.Text;
using MyCaffe.basecode;
using MyCaffe.common;
using MyCaffe.param;
using MyCaffe.param.lnn;

namespace MyCaffe.layers.lnn
{
    /// <summary>
    /// The CfcUnitLayer implements the Closed form Continuous Cell (CfcCell) layer.
    /// </summary>
    /// <typeparam name="T">Specifies the base type of float or double.</typeparam>
    public class CfcUnitLayer<T> : LnnUnitLayer<T>
    {
        Layer<T> m_cat;
        Layer<T>[] m_rgLinearLayers = null;
        Layer<T>[] m_rgActivationLayers = null;
        Layer<T>[] m_rgDropoutLayers = null;
        BlobCollection<T> m_rgLinearBtms = new BlobCollection<T>();
        BlobCollection<T> m_rgLinearTops = new BlobCollection<T>();
        BlobCollection<T> m_rgActivationBtms = new BlobCollection<T>();
        BlobCollection<T> m_rgActivationTops = new BlobCollection<T>();
        BlobCollection<T> m_colTop = new BlobCollection<T>();
        BlobCollection<T> m_colBtm = new BlobCollection<T>();
        Layer<T> m_tanh;
        Layer<T> m_sigmoid;
        Layer<T> m_ff1;
        Layer<T> m_ff2;
        Layer<T> m_timeA;
        Layer<T> m_timeB;
        Blob<T> m_blobFF1;
        Blob<T> m_blobFF2;
        Blob<T> m_blobTimeA;
        Blob<T> m_blobTimeB;
        Blob<T> m_blobTInterp;
        Blob<T> m_blobTInterp1;
        Blob<T> m_blobTInterpInv;
        Blob<T> m_blobTInterpOnes;
        Blob<T> m_blobTs;
        Blob<T> m_blobX;
        Blob<T> m_blobTop1;
        Blob<T> m_blobTop2;
        int m_nNumLayers;
        int m_nNumUnits;

        /// <summary>
        /// The CfcUnitLayer constructor.
        /// </summary>
        /// <param name="cuda">Specifies the CudaDnn connection to Cuda.</param>
        /// <param name="log">Specifies the Log for output.</param>
        /// <param name="p">Specifies the LayerParameter of type CFC_UNIT with its cfc_unit_param settings.</param>
        public CfcUnitLayer(CudaDnn<T> cuda, Log log, LayerParameter p)
            : base(cuda, log, p)
        {
            m_type = LayerParameter.LayerType.CFC_UNIT;

            m_nNumLayers = p.cfc_unit_param.backbone_layers;
            m_nNumUnits = p.cfc_unit_param.backbone_units;

            if (m_nNumLayers < 1)
                m_nNumLayers = 1;

            LayerParameter concat = new LayerParameter(LayerParameter.LayerType.CONCAT, "concat");
            concat.concat_param.axis = 1;
            m_cat = Layer<T>.Create(m_cuda, m_log, convertLayerParam(concat, p), null);

            Blob<T> blobBtm = new Blob<T>(m_cuda, m_log);
            blobBtm.Name = "bb";

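            // Backbone: the concatenated (input, hx) tensor is run through 'backbone_layers'
            // blocks of InnerProduct -> activation (-> dropout on all but the first block when
            // backbone_dropout_ratio > 0).  The bottom/top blobs created below are chained so
            // that each block's activation output becomes the next block's linear input.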
            for (int i = 0; i < m_nNumLayers; i++)
            {
                // Linear Layer
                m_rgLinearBtms.Add(blobBtm);

                Blob<T> blobTop = new Blob<T>(m_cuda, m_log);
                blobTop.Name = "bb_" + i.ToString();

                m_rgLinearTops.Add(blobTop);

                // Activation Layer
                blobBtm = blobTop;
                m_rgActivationBtms.Add(blobBtm);

                blobTop = new Blob<T>(m_cuda, m_log);
                blobTop.Name = "bb_act_" + i.ToString();

                m_rgActivationTops.Add(blobTop);
                blobBtm = blobTop;
            }

            m_rgLinearLayers = new Layer<T>[m_nNumLayers];
            m_rgActivationLayers = new Layer<T>[m_nNumLayers];

            if (m_param.cfc_unit_param.backbone_dropout_ratio > 0)
                m_rgDropoutLayers = new Layer<T>[m_nNumLayers];

            for (int i = 0; i < m_nNumLayers; i++)
            {
                LayerParameter ip = new LayerParameter(LayerParameter.LayerType.INNERPRODUCT, "bb_" + i.ToString());
                ip.inner_product_param.num_output = (uint)m_nNumUnits;
                ip.inner_product_param.bias_term = true;
                ip.inner_product_param.weight_filler = new FillerParameter("xavier", 0.0, 0.01);
                ip.inner_product_param.bias_filler = new FillerParameter("constant", 0.1);
                m_rgLinearLayers[i] = Layer<T>.Create(m_cuda, m_log, convertLayerParam(ip, p), null);

                LayerParameter act;
                switch (m_param.cfc_unit_param.backbone_activation)
                {
                    case CfcUnitParameter.ACTIVATION.SILU:
                        act = new LayerParameter(LayerParameter.LayerType.SILU, "bb_act_" + i.ToString());
                        break;

                    case CfcUnitParameter.ACTIVATION.RELU:
                        act = new LayerParameter(LayerParameter.LayerType.RELU, "bb_act_" + i.ToString());
                        break;

                    case CfcUnitParameter.ACTIVATION.TANH:
                        act = new LayerParameter(LayerParameter.LayerType.TANH, "bb_act_" + i.ToString());
                        break;

                    case CfcUnitParameter.ACTIVATION.GELU:
                        act = new LayerParameter(LayerParameter.LayerType.GELU, "bb_act_" + i.ToString());
                        break;

                    case CfcUnitParameter.ACTIVATION.LECUN:
                        act = new LayerParameter(LayerParameter.LayerType.LECUN, "bb_act_" + i.ToString());
                        break;

                    default:
                        throw new Exception("Unknown activation type: " + m_param.cfc_unit_param.backbone_activation.ToString());
                }

                m_rgActivationLayers[i] = Layer<T>.Create(m_cuda, m_log, convertLayerParam(act, p), null);

                if (i > 0 && m_rgDropoutLayers != null)
                {
                    LayerParameter drop = new LayerParameter(LayerParameter.LayerType.DROPOUT, "bb_drop_" + i.ToString());
                    drop.dropout_param.dropout_ratio = m_param.cfc_unit_param.backbone_dropout_ratio;
                    m_rgDropoutLayers[i] = Layer<T>.Create(m_cuda, m_log, convertLayerParam(drop, p), null);
                }
            }

            m_blobX = new Blob<T>(m_cuda, m_log);
            m_blobX.Name = "x";

            // FF1 Layer
            LayerParameter ff1 = new LayerParameter(LayerParameter.LayerType.INNERPRODUCT, "ff1");
            ff1.inner_product_param.num_output = (uint)m_param.cfc_unit_param.hidden_size;
            ff1.inner_product_param.bias_term = true;
            ff1.inner_product_param.weight_filler = new FillerParameter("xavier", 0.0, 0.01);
            ff1.inner_product_param.bias_filler = new FillerParameter("constant", 0.1);
            m_ff1 = Layer<T>.Create(m_cuda, m_log, convertLayerParam(ff1, p), null);

            m_blobFF1 = new Blob<T>(m_cuda, m_log);
            m_blobFF1.Name = "ff1";

            // Tanh Layer
            LayerParameter tanh = new LayerParameter(LayerParameter.LayerType.TANH, "tanh");
            m_tanh = Layer<T>.Create(m_cuda, m_log, convertLayerParam(tanh, p), null);

            // FF2 Layer
            LayerParameter ff2 = new LayerParameter(LayerParameter.LayerType.INNERPRODUCT, "ff2");
            ff2.inner_product_param.num_output = (uint)m_param.cfc_unit_param.hidden_size;
            ff2.inner_product_param.bias_term = true;
            ff2.inner_product_param.weight_filler = new FillerParameter("xavier", 0.0, 0.01);
            ff2.inner_product_param.bias_filler = new FillerParameter("constant", 0.1);
            m_ff2 = Layer<T>.Create(m_cuda, m_log, convertLayerParam(ff2, p), null);

            m_blobFF2 = new Blob<T>(m_cuda, m_log);
            m_blobFF2.Name = "ff2";

            // Time A Layer
            LayerParameter timeA = new LayerParameter(LayerParameter.LayerType.INNERPRODUCT, "time_a");
            timeA.inner_product_param.num_output = (uint)m_param.cfc_unit_param.hidden_size;
            timeA.inner_product_param.bias_term = true;
            timeA.inner_product_param.weight_filler = new FillerParameter("xavier", 0.0, 0.01);
            timeA.inner_product_param.bias_filler = new FillerParameter("constant", 0.1);
            m_timeA = Layer<T>.Create(m_cuda, m_log, convertLayerParam(timeA, p), null);

            m_blobTimeA = new Blob<T>(m_cuda, m_log);
            m_blobTimeA.Name = "time_a";

            // Time B Layer
            LayerParameter timeB = new LayerParameter(LayerParameter.LayerType.INNERPRODUCT, "time_b");
            timeB.inner_product_param.num_output = (uint)m_param.cfc_unit_param.hidden_size;
            timeB.inner_product_param.bias_term = true;
            timeB.inner_product_param.weight_filler = new FillerParameter("xavier", 0.0, 0.01);
            timeB.inner_product_param.bias_filler = new FillerParameter("constant", 0.1);
            m_timeB = Layer<T>.Create(m_cuda, m_log, convertLayerParam(timeB, p), null);

            m_blobTimeB = new Blob<T>(m_cuda, m_log);
            m_blobTimeB.Name = "time_b";

            // Sigmoid Layer
            LayerParameter sigmoid = new LayerParameter(LayerParameter.LayerType.SIGMOID, "sigmoid");
            m_sigmoid = Layer<T>.Create(m_cuda, m_log, convertLayerParam(sigmoid, p), null);

            // T-Interp
            m_blobTInterp = new Blob<T>(m_cuda, m_log);
            m_blobTInterp.Name = "t-interp";

            m_blobTInterpInv = new Blob<T>(m_cuda, m_log);
            m_blobTInterpInv.Name = "t-interpinv";

            m_blobTInterp1 = new Blob<T>(m_cuda, m_log);
            m_blobTInterp1.Name = "t-interp1";
            m_blobTInterpOnes = new Blob<T>(m_cuda, m_log, true);
            m_blobTInterpOnes.Name = "t_interp_ones";

            m_blobTs = new Blob<T>(m_cuda, m_log);
            m_blobTs.Name = "ts";

            m_blobTop1 = new Blob<T>(m_cuda, m_log);
            m_blobTop1.Name = "top1";
            m_blobTop2 = new Blob<T>(m_cuda, m_log);
            m_blobTop2.Name = "top2";
        }

        /// <summary>
        /// Releases all GPU and host resources used by the Layer.
        /// </summary>
        protected override void dispose()
        {
            base.dispose();

            if (m_rgLinearLayers != null)
            {
                for (int i = 0; i < m_rgLinearLayers.Length; i++)
                {
                    m_rgLinearLayers[i].Dispose();
                }
                m_rgLinearLayers = null;
            }

            if (m_bOwnInternalBlobs)
                dispose_internal_blobs();
            else
                clear_internal_blobs();

            dispose(ref m_blobTInterpOnes);

            dispose(ref m_cat);
            dispose(ref m_tanh);
            dispose(ref m_sigmoid);
            dispose(ref m_ff1);
            dispose(ref m_ff2);
            dispose(ref m_timeA);
            dispose(ref m_timeB);
        }

        private void dispose_internal_blobs(bool bSetToNull = true)
        {
            dispose(ref m_rgLinearBtms, bSetToNull);
            dispose(ref m_rgLinearTops, bSetToNull);
            dispose(ref m_rgActivationBtms, bSetToNull);
            dispose(ref m_rgActivationTops, bSetToNull);

            dispose(ref m_blobFF1);
            dispose(ref m_blobFF2);
            dispose(ref m_blobTimeA);
            dispose(ref m_blobTimeB);
            dispose(ref m_blobTInterp);
            dispose(ref m_blobTInterp1);
            dispose(ref m_blobTInterpInv);
            dispose(ref m_blobTs);
            dispose(ref m_blobX);
            dispose(ref m_blobTop1);
            dispose(ref m_blobTop2);
        }

        private void clear_internal_blobs()
        {
            m_rgLinearBtms.Clear();
            m_rgLinearTops.Clear();
            m_rgActivationBtms.Clear();
            m_rgActivationTops.Clear();
        }

        /// <summary>
        /// Create the internal shared blobs used by the layer for a given index.
        /// </summary>
        /// <param name="nIdx">Specifies the index used to name the shared blobs.</param>
        /// <param name="cuda">Specifies the CudaDnn connection to Cuda.</param>
        /// <param name="log">Specifies the Log for output.</param>
        /// <returns>The collection of newly created blobs is returned.</returns>
        public override BlobCollection<T> CreateInternalSharedBlobs(int nIdx, CudaDnn<T> cuda, Log log)
        {
            BlobCollection<T> col = new BlobCollection<T>();

            dispose_internal_blobs(false);

            Blob<T> blobFF1 = new Blob<T>(cuda, log);
            blobFF1.Name = "ff1_" + nIdx.ToString();
            col.Add(blobFF1);

            Blob<T> blobFF2 = new Blob<T>(cuda, log);
            blobFF2.Name = "ff2_" + nIdx.ToString();
            col.Add(blobFF2);

            Blob<T> blobTimeA = new Blob<T>(cuda, log);
            blobTimeA.Name = "timeA_" + nIdx.ToString();
            col.Add(blobTimeA);

            Blob<T> blobTimeB = new Blob<T>(cuda, log);
            blobTimeB.Name = "timeB_" + nIdx.ToString();
            col.Add(blobTimeB);

            Blob<T> blobTInterp = new Blob<T>(cuda, log);
            blobTInterp.Name = "tInterp_" + nIdx.ToString();
            col.Add(blobTInterp);

            Blob<T> blobTInterp1 = new Blob<T>(cuda, log);
            blobTInterp1.Name = "tInterp1_" + nIdx.ToString();
            col.Add(blobTInterp1);

            Blob<T> blobTInterpInv = new Blob<T>(cuda, log);
            blobTInterpInv.Name = "tInterpInv_" + nIdx.ToString();
            col.Add(blobTInterpInv);

            Blob<T> blobTs = new Blob<T>(cuda, log);
            blobTs.Name = "ts_" + nIdx.ToString();
            col.Add(blobTs);

            Blob<T> blobX = new Blob<T>(cuda, log);
            blobX.Name = "x_" + nIdx.ToString();
            col.Add(blobX);

            Blob<T> blobTop1 = new Blob<T>(cuda, log);
            blobTop1.Name = "top1_" + nIdx.ToString();
            col.Add(blobTop1);

            Blob<T> blobTop2 = new Blob<T>(cuda, log);
            blobTop2.Name = "top2_" + nIdx.ToString();
            col.Add(blobTop2);

            Blob<T> blobBb = new Blob<T>(cuda, log);
            blobBb.Name = "bb_" + nIdx.ToString();
            col.Add(blobBb);

            for (int i = 0; i < m_param.cfc_unit_param.backbone_layers; i++)
            {
                Blob<T> blobFc = new Blob<T>(cuda, log);
                blobFc.Name = "bb_fc" + (i + 1).ToString() + "_" + nIdx.ToString();
                col.Add(blobFc);

                Blob<T> blobAct = new Blob<T>(cuda, log);
                blobAct.Name = "bb_act" + (i + 1).ToString() + "_" + nIdx.ToString();
                col.Add(blobAct);
            }

            return col;
        }
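        // Sharing note: CreateInternalSharedBlobs() and SetInternalSharedBlobs() allow an owner
        // (for example, a layer that unrolls this unit over several steps) to allocate one set of
        // working blobs externally and hand them to this unit.  Once shared, m_bOwnInternalBlobs is
        // set to false and dispose() no longer frees those blobs; it only clears the references.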

        /// <summary>
        /// Set the internal shared blobs to a set of external blobs.
        /// </summary>
        /// <param name="col">Specifies the external blobs to use, in the order created by CreateInternalSharedBlobs.</param>
        public override void SetInternalSharedBlobs(BlobCollection<T> col)
        {
            int nIdx = 0;

            m_bOwnInternalBlobs = false;
            m_blobFF1 = col[nIdx];
            nIdx++;

            m_blobFF2 = col[nIdx];
            nIdx++;

            m_blobTimeA = col[nIdx];
            nIdx++;

            m_blobTimeB = col[nIdx];
            nIdx++;

            m_blobTInterp = col[nIdx];
            nIdx++;

            m_blobTInterp1 = col[nIdx];
            nIdx++;

            m_blobTInterpInv = col[nIdx];
            nIdx++;

            m_blobTs = col[nIdx];
            nIdx++;

            m_blobX = col[nIdx];
            nIdx++;

            m_blobTop1 = col[nIdx];
            nIdx++;

            m_blobTop2 = col[nIdx];
            nIdx++;

            BlobCollection<T> colLin = new BlobCollection<T>();
            while (nIdx < col.Count)
            {
                colLin.Add(col[nIdx]);
                nIdx++;
            }

            m_rgLinearBtms.Clear();
            m_rgLinearTops.Clear();
            m_rgActivationBtms.Clear();
            m_rgActivationTops.Clear();

            nIdx = 0;
            for (int i = 0; i < m_param.cfc_unit_param.backbone_layers; i++)
            {
                m_rgLinearBtms.Add(colLin[nIdx]);
                nIdx++;
                m_rgLinearTops.Add(colLin[nIdx]);
                m_rgActivationBtms.Add(colLin[nIdx]);
                nIdx++;
                m_rgActivationTops.Add(colLin[nIdx]);
            }

            colLin.Clear();
        }

        private void addBtmTop(Blob<T> btm, Blob<T> top)
        {
            m_colBtm.Clear();
            m_colBtm.Add(btm);
            m_colTop.Clear();
            m_colTop.Add(top);
        }

        /// <summary>
        /// Derivative layers should add all internal blobs to the 'col' provided.
        /// </summary>
        /// <param name="col">Specifies the collection of internal blobs.</param>
        protected override void setup_internal_blobs(BlobCollection<T> col)
        {
            if (col.Count > 0)
                return;
        }

        /// <summary>
        /// Returns the exact number of required bottom (input) Blobs: input, hx, ts.
        /// </summary>
        public override int ExactNumBottomBlobs
        {
            get { return 3; }
        }

        /// <summary>
        /// Returns the exact number of required top (output) Blobs: the new hidden state.
        /// </summary>
        public override int ExactNumTopBlobs
        {
            get { return 1; }
        }

        /// <summary>
        /// Re-initialize the parameters of the layer.
        /// </summary>
        /// <param name="target">Specifies the weights to target (e.g. weights, bias or both).</param>
        /// <returns>When handled, this method returns true, otherwise false.</returns>
        public override bool ReInitializeParameters(WEIGHT_TARGET target)
        {
            base.ReInitializeParameters(target);
            return true;
        }

        /// <summary>
        /// Setup the layer.
        /// </summary>
        /// <param name="colBottom">Specifies the collection of bottom (input) Blobs: input, hx, ts.</param>
        /// <param name="colTop">Specifies the collection of top (output) Blobs.</param>
        public override void LayerSetUp(BlobCollection<T> colBottom, BlobCollection<T> colTop)
        {
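            // Note: the learnable blobs of each sub-layer created in the constructor (the backbone
            // InnerProduct layers, ff1, ff2, time_a and time_b) are appended to this layer's 'blobs'
            // collection below, so they are exposed as this layer's learnable parameters.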
            addBtmTop(colBottom[0], m_rgLinearBtms[0]);
            m_colBtm.Add(colBottom[1]);
            m_cat.Setup(m_colBtm, m_colTop);

            for (int i = 0; i < m_nNumLayers; i++)
            {
                addBtmTop(m_rgLinearBtms[i], m_rgLinearTops[i]);
                m_rgLinearLayers[i].Setup(m_colBtm, m_colTop);
                blobs.Add(m_rgLinearLayers[i].blobs);

                addBtmTop(m_rgActivationBtms[i], m_rgActivationTops[i]);
                m_rgActivationLayers[i].Setup(m_colBtm, m_colTop);

                if (i > 0 && m_rgDropoutLayers != null)
                    m_rgDropoutLayers[i].Setup(m_colBtm, m_colTop);
            }

            Blob<T> blobX = m_rgActivationTops[m_nNumLayers - 1];
            m_blobX.ReshapeLike(blobX);

            // FF1 Layer
            addBtmTop(blobX, m_blobFF1);
            m_ff1.Setup(m_colBtm, m_colTop);
            blobs.Add(m_ff1.blobs);

            // Tanh Layer
            addBtmTop(m_blobFF1, m_blobFF1);
            m_tanh.Setup(m_colBtm, m_colTop);

            // FF2 Layer
            addBtmTop(blobX, m_blobFF2);
            m_ff2.Setup(m_colBtm, m_colTop);
            blobs.Add(m_ff2.blobs);

            addBtmTop(m_blobFF2, m_blobFF2);
            m_tanh.Setup(m_colBtm, m_colTop);

            // Time A Layer
            addBtmTop(blobX, m_blobTimeA);
            m_timeA.Setup(m_colBtm, m_colTop);
            blobs.Add(m_timeA.blobs);

            // Time B Layer
            addBtmTop(blobX, m_blobTimeB);
            m_timeB.Setup(m_colBtm, m_colTop);
            blobs.Add(m_timeB.blobs);

            // T-Interp
            m_blobTInterp.ReshapeLike(m_blobTimeA);
            m_blobTInterpInv.ReshapeLike(m_blobTimeA);
            m_blobTInterp1.ReshapeLike(m_blobTimeA);
            m_blobTInterpOnes.ReshapeLike(m_blobTimeA);

            addBtmTop(m_blobTInterp, colTop[0]);
            m_sigmoid.Setup(m_colBtm, m_colTop);

            m_blobTs.ReshapeLike(m_blobTimeA);
            m_blobTop1.ReshapeLike(colTop[0]);
            m_blobTop2.ReshapeLike(colTop[0]);
        }

        /// <summary>
        /// Reshape the bottom (input) and top (output) blobs.
        /// </summary>
        /// <param name="colBottom">Specifies the collection of bottom (input) Blobs: input, hx, ts.</param>
        /// <param name="colTop">Specifies the collection of top (output) Blobs.</param>
        public override void Reshape(BlobCollection<T> colBottom, BlobCollection<T> colTop)
        {
            addBtmTop(colBottom[0], m_rgLinearBtms[0]);
            m_colBtm.Add(colBottom[1]);
            m_cat.Reshape(m_colBtm, m_colTop);

            for (int i = 0; i < m_rgLinearLayers.Length; i++)
            {
                addBtmTop(m_rgLinearBtms[i], m_rgLinearTops[i]);
                m_rgLinearLayers[i].Reshape(m_colBtm, m_colTop);

                addBtmTop(m_rgActivationBtms[i], m_rgActivationTops[i]);
                m_rgActivationLayers[i].Reshape(m_colBtm, m_colTop);

                if (m_rgDropoutLayers != null && m_rgDropoutLayers[i] != null)
                    m_rgDropoutLayers[i].Reshape(m_colBtm, m_colTop);
            }

            Blob<T> blobX = m_rgActivationTops[m_rgLinearLayers.Length - 1];
            m_blobX.ReshapeLike(blobX);

            // FF1 Layer
            addBtmTop(blobX, m_blobFF1);
            m_ff1.Reshape(m_colBtm, m_colTop);

            // Tanh Layer
            addBtmTop(m_blobFF1, m_blobFF1);
            m_tanh.Reshape(m_colBtm, m_colTop);

            // FF2 Layer
            addBtmTop(blobX, m_blobFF2);
            m_ff2.Reshape(m_colBtm, m_colTop);

            addBtmTop(m_blobFF2, m_blobFF2);
            m_tanh.Reshape(m_colBtm, m_colTop);

            // Time A Layer
            addBtmTop(blobX, m_blobTimeA);
            m_timeA.Reshape(m_colBtm, m_colTop);
            m_blobTs.ReshapeLike(m_blobTimeA);

            m_blobTInterp.ReshapeLike(m_blobTimeA);
            m_blobTInterpInv.ReshapeLike(m_blobTimeA);
            m_blobTInterp1.ReshapeLike(m_blobTimeA);
            m_blobTInterpOnes.ReshapeLike(m_blobTimeA);
            m_blobTInterpOnes.SetData(1.0);

            // Time B Layer
            addBtmTop(blobX, m_blobTimeB);
            m_timeB.Reshape(m_colBtm, m_colTop);

            // Sigmoid Layer
            addBtmTop(m_blobTInterp, colTop[0]);
            m_sigmoid.Reshape(m_colBtm, m_colTop);

            m_blobTop1.ReshapeLike(colTop[0]);
            m_blobTop2.ReshapeLike(colTop[0]);
        }

        /// <summary>
        /// Forward computation.
        /// </summary>
        /// <param name="colBottom">Specifies the collection of bottom (input) Blobs: input, hx, ts.</param>
        /// <param name="colTop">Specifies the collection of top (output) Blobs.</param>
        protected override void forward(BlobCollection<T> colBottom, BlobCollection<T> colTop)
        {
            addBtmTop(colBottom[0], m_rgLinearBtms[0]);
            m_colBtm.Add(colBottom[1]);
            m_cat.Forward(m_colBtm, m_colTop);

            for (int i = 0; i < m_rgLinearLayers.Length; i++)
            {
                addBtmTop(m_rgLinearBtms[i], m_rgLinearTops[i]);
                m_rgLinearLayers[i].Forward(m_colBtm, m_colTop);

                addBtmTop(m_rgActivationBtms[i], m_rgActivationTops[i]);
                m_rgActivationLayers[i].Forward(m_colBtm, m_colTop);

                if (m_rgDropoutLayers != null && m_rgDropoutLayers[i] != null)
                    m_rgDropoutLayers[i].Forward(m_colBtm, m_colTop);
            }

            Blob<T> blobX = m_rgActivationTops[m_rgLinearLayers.Length - 1];
            m_blobX.CopyFrom(blobX, false);

            // FF1 Layer
            addBtmTop(blobX, m_blobFF1);
            m_ff1.Forward(m_colBtm, m_colTop);

            // Tanh Layer
            addBtmTop(m_blobFF1, m_blobFF1);
            m_tanh.Forward(m_colBtm, m_colTop);

            // FF2 Layer
            addBtmTop(blobX, m_blobFF2);
            m_ff2.Forward(m_colBtm, m_colTop);

            addBtmTop(m_blobFF2, m_blobFF2);
            m_tanh.Forward(m_colBtm, m_colTop);

            // Time A Layer
            addBtmTop(blobX, m_blobTimeA);
            m_timeA.Forward(m_colBtm, m_colTop);

            // Time B Layer
            addBtmTop(blobX, m_blobTimeB);
            m_timeB.Forward(m_colBtm, m_colTop);

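            // The remaining steps implement the CfC closed-form update:
            //   t_interp = sigmoid(time_a * ts + time_b)
            //   gated:    top = ff1 * (1 - t_interp) + t_interp * ff2
            //   no_gate:  top = ff1 + t_interp * ff2
            // where ff1 and ff2 are the tanh-activated linear heads computed above from the
            // backbone output x, and ts is the per-sample timespan broadcast across channels.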
            // Calculate the t-interpolation factor.
            m_cuda.channel_fillfrom(m_blobTs.count(), m_blobTs.num, 1, m_blobTs.channels, colBottom[2].gpu_data, m_blobTs.mutable_gpu_data, DIR.FWD);
            // t_a * ts
            m_cuda.mul(m_blobTInterp.count(), m_blobTimeA.gpu_data, m_blobTs.gpu_data, m_blobTInterp.mutable_gpu_data);

            // t_interp = t_a * ts + t_b
            m_cuda.add(m_blobTInterp.count(), m_blobTimeB.gpu_data, m_blobTInterp.gpu_data, m_blobTInterp.mutable_gpu_data);

            // Sigmoid Layer
            addBtmTop(m_blobTInterp, m_blobTInterp);
            m_sigmoid.Forward(m_colBtm, m_colTop);

            if (m_param.cfc_unit_param.no_gate)
            {
                // t_interp * ff2
                m_cuda.mul(m_blobTop1.count(), m_blobTInterp.gpu_data, m_blobFF2.gpu_data, m_blobTop1.mutable_gpu_data);
                // ff1 + t_interp * ff2
                m_cuda.add(m_blobTop2.count(), m_blobFF1.gpu_data, m_blobTop1.gpu_data, m_blobTop2.mutable_gpu_data);
                colTop[0].CopyFrom(m_blobTop2);
            }
            else
            {
                // 1.0 - t_interp
                m_blobTInterpInv.SetData(1.0);
                m_cuda.sub(m_blobTInterpInv.count(), m_blobTInterpInv.gpu_data, m_blobTInterp.gpu_data, m_blobTInterpInv.mutable_gpu_data);
                // ff1 * (1.0 - t_interp)
                m_cuda.mul(m_blobTInterpInv.count(), m_blobTInterpInv.gpu_data, m_blobFF1.gpu_data, m_blobTop1.mutable_gpu_data);
                // t_interp * ff2
                m_cuda.mul(colTop[0].count(), m_blobTInterp.gpu_data, m_blobFF2.gpu_data, m_blobTop2.mutable_gpu_data);
                // ff1 * (1.0 - t_interp) + t_interp * ff2
                m_cuda.add(colTop[0].count(), m_blobTop1.gpu_data, m_blobTop2.gpu_data, colTop[0].mutable_gpu_data);
            }
        }

        /// <summary>
        /// Computes the error gradient w.r.t. the CfcUnit value inputs.
        /// </summary>
        /// <param name="colTop">Specifies the collection of top (output) Blobs, whose diff contains the error gradient.</param>
        /// <param name="rgbPropagateDown">Specifies whether or not to propagate down to each bottom Blob.</param>
        /// <param name="colBottom">Specifies the collection of bottom (input) Blobs: input, hx, ts.</param>
        protected override void backward(BlobCollection<T> colTop, List<bool> rgbPropagateDown, BlobCollection<T> colBottom)
        {
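            // Gradients of the output mix w.r.t. its three operands, mirroring the forward pass:
            //   gated:   d(top)/d(ff1) = 1 - t_interp,  d(top)/d(ff2) = t_interp,  d(top)/d(t_interp) = ff2 - ff1
            //   no_gate: d(top)/d(ff1) = 1,             d(top)/d(ff2) = t_interp,  d(top)/d(t_interp) = ff2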
            if (m_param.cfc_unit_param.no_gate)
            {
                // ff1 grad = top.grad * 1.0
                m_blobFF1.CopyFrom(colTop[0], true);

                // ff2 grad = top.grad * t_interp
                m_cuda.mul(m_blobFF2.count(), colTop[0].gpu_diff, m_blobTInterp.gpu_data, m_blobFF2.mutable_gpu_diff);

                // t_interp grad = top.grad * ff2
                m_cuda.mul(m_blobTInterp.count(), colTop[0].gpu_diff, m_blobFF2.gpu_data, m_blobTInterp1.mutable_gpu_diff);
            }
            else
            {
                // ff1 grad = top.grad * (1.0 - t_interp)
                m_cuda.sub(m_blobFF1.count(), m_blobTInterpOnes.gpu_data, m_blobTInterp.gpu_data, m_blobFF1.mutable_gpu_diff);
                m_cuda.mul(m_blobFF1.count(), m_blobFF1.gpu_diff, colTop[0].gpu_diff, m_blobFF1.mutable_gpu_diff);

                // ff2 grad = top.grad * t_interp
                m_cuda.mul(m_blobFF2.count(), colTop[0].gpu_diff, m_blobTInterp.gpu_data, m_blobFF2.mutable_gpu_diff);

                // ti grad = top.grad * (ff2 - ff1)
                m_cuda.sub(m_blobTInterp1.count(), m_blobFF2.gpu_data, m_blobFF1.gpu_data, m_blobTInterp1.mutable_gpu_diff);
                m_cuda.mul(m_blobTInterp1.count(), m_blobTInterp1.gpu_diff, colTop[0].gpu_diff, m_blobTInterp1.mutable_gpu_diff);
            }

            // Sigmoid Grad
            m_blobTInterp1.CopyFrom(m_blobTInterp);
            addBtmTop(m_blobTInterp, m_blobTInterp1);
            m_sigmoid.Backward(m_colTop, rgbPropagateDown, m_colBtm);

            // t_b grad = t-interp grad * 1.0
            m_blobTimeB.CopyFrom(m_blobTInterp, true);

            // t_a grad = t-interp grad * ts
            m_cuda.mul(m_blobTimeA.count(), m_blobTInterp.gpu_diff, m_blobTs.gpu_data, m_blobTimeA.mutable_gpu_diff);

            // ts grad = t-interp grad * t_a
            m_cuda.mul(m_blobTs.count(), m_blobTInterp.gpu_diff, m_blobTimeA.gpu_data, m_blobTs.mutable_gpu_diff);
            m_cuda.channel_sum(m_blobTs.count(), 1, m_blobTs.num, m_blobTs.channels, m_blobTs.gpu_diff, colBottom[2].mutable_gpu_diff, false);

            Blob<T> blobX = m_rgActivationTops[m_rgActivationTops.Count - 1];
            blobX.SetDiff(0);

            // time_b grad
            addBtmTop(m_blobX, m_blobTimeB);
            m_timeB.Backward(m_colTop, rgbPropagateDown, m_colBtm);
            m_cuda.add(m_blobX.count(), m_blobX.gpu_diff, blobX.gpu_diff, blobX.mutable_gpu_diff);

            // time_a grad
            addBtmTop(m_blobX, m_blobTimeA);
            m_timeA.Backward(m_colTop, rgbPropagateDown, m_colBtm);
            m_cuda.add(m_blobX.count(), m_blobX.gpu_diff, blobX.gpu_diff, blobX.mutable_gpu_diff);

            // ff2 grad
            addBtmTop(m_blobFF2, m_blobFF2);
            m_tanh.Backward(m_colTop, rgbPropagateDown, m_colBtm);

            addBtmTop(m_blobX, m_blobFF2);
            m_ff2.Backward(m_colTop, rgbPropagateDown, m_colBtm);
            m_cuda.add(m_blobX.count(), m_blobX.gpu_diff, blobX.gpu_diff, blobX.mutable_gpu_diff);

            // ff1 grad
            addBtmTop(m_blobFF1, m_blobFF1);
            m_tanh.Backward(m_colTop, rgbPropagateDown, m_colBtm);

            addBtmTop(m_blobX, m_blobFF1);
            m_ff1.Backward(m_colTop, rgbPropagateDown, m_colBtm);
            m_cuda.add(m_blobX.count(), m_blobX.gpu_diff, blobX.gpu_diff, blobX.mutable_gpu_diff);

            // Backbone grad
            for (int i = m_rgLinearLayers.Length - 1; i >= 0; i--)
            {
                addBtmTop(m_rgActivationBtms[i], m_rgActivationTops[i]);

                if (m_rgDropoutLayers != null && m_rgDropoutLayers[i] != null)
                    m_rgDropoutLayers[i].Backward(m_colTop, rgbPropagateDown, m_colBtm);

                m_rgActivationLayers[i].Backward(m_colTop, rgbPropagateDown, m_colBtm);

                addBtmTop(m_rgLinearBtms[i], m_rgLinearTops[i]);
                m_rgLinearLayers[i].Backward(m_colTop, rgbPropagateDown, m_colBtm);
            }

            addBtmTop(colBottom[0], m_rgLinearBtms[0]);
            m_colBtm.Add(colBottom[1]);
            m_cat.Backward(m_colTop, new List<bool>() { true, true }, m_colBtm);
        }
    }
}
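A minimal stand-alone usage sketch (not part of CfcUnitLayer.cs above): it shows how a CFC_UNIT LayerParameter might be filled in from cfc_unit_param and how the three bottom blobs (input, hx, ts) and the single top blob are wired through Setup/Forward. The device id, batch size, input size and hidden size are illustrative assumptions, as is the Blob constructor taking explicit (num, channels, height, width) dimensions; check CfcUnitParameter and Blob for the exact defaults before relying on this.

// Sketch only - assumes CUDA device 0, batch 16, input size 8, hidden size 64.
CudaDnn<float> cuda = new CudaDnn<float>(0);
Log log = new Log("cfc_unit_sample");

LayerParameter p = new LayerParameter(LayerParameter.LayerType.CFC_UNIT, "cfc_unit");
p.cfc_unit_param.hidden_size = 64;
p.cfc_unit_param.backbone_units = 64;
p.cfc_unit_param.backbone_layers = 2;
p.cfc_unit_param.backbone_dropout_ratio = 0.0f;
p.cfc_unit_param.backbone_activation = CfcUnitParameter.ACTIVATION.LECUN;
p.cfc_unit_param.no_gate = false;

Layer<float> layer = Layer<float>.Create(cuda, log, p, null);

// Bottom blobs: input (N x input_size), hx (N x hidden_size), ts (N x 1).
Blob<float> blobInput = new Blob<float>(cuda, log, 16, 8, 1, 1);
Blob<float> blobHx = new Blob<float>(cuda, log, 16, 64, 1, 1);
Blob<float> blobTs = new Blob<float>(cuda, log, 16, 1, 1, 1);
Blob<float> blobTop = new Blob<float>(cuda, log);

BlobCollection<float> colBottom = new BlobCollection<float>();
colBottom.Add(blobInput);
colBottom.Add(blobHx);
colBottom.Add(blobTs);
BlobCollection<float> colTop = new BlobCollection<float>();
colTop.Add(blobTop);

layer.Setup(colBottom, colTop);
layer.Forward(colBottom, colTop);   // colTop[0] now holds the new hidden state (N x hidden_size).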