mycaffe/html/_recurrent_parameter_8cs_source.html

using System;

using System.Collections.Generic;

using System.ComponentModel;

using System.IO;

using System.Linq;

using System.Text;

using System.Threading.Tasks;

using MyCaffe.basecode;


namespace MyCaffe.param

{

    /// <summary>
    /// Specifies the parameters used by the RecurrentLayer.
    /// </summary>
    /// <remarks>
    /// Several settings are only meaningful when the cuDnn engine is used; these are
    /// marked 'cuDnn only' below.
    /// </remarks>
    [Serializable]
    [TypeConverter(typeof(ExpandableObjectConverter))]
    public class RecurrentParameter : EngineParameter
    {
        uint m_nNumOutput = 0;
        FillerParameter m_weight_filler = new FillerParameter("xavier");
        FillerParameter m_bias_filler = new FillerParameter("constant", 0.1);
        bool m_bDebugInfo = false;
        bool m_bExposeHiddenInput = false;
        bool m_bExposeHiddenOutput = false;
        uint m_nNumLayers = 1; // cuDnn only
        double m_dfDropoutRatio = 0.0; // cuDnn only
        long m_lDropoutSeed = 0; // cuDnn only
        bool m_bBidirectional = false; // cuDnn only
        bool m_bCudnnEnableTensorCores = false; // cuDnn only
        bool m_bBatchFirst = false; // input and output have the batch in the first dim.
        bool m_bAutoRepeatHiddenStatesAcrossLayers = false;
        bool m_bUseCudnnRnn8IfSupported = false; // cuDnn only

        /// <summary>
        /// Constructor for the parameter.
        /// </summary>
        public RecurrentParameter()
        {
        }

        /// <summary>
        /// Returns the reason that the Caffe version was used instead of NVIDIA's cuDnn.
        /// </summary>
        /// <returns>A description of the reason when the engine is CAFFE or DEFAULT, otherwise an empty string.</returns>
        public string useCaffeReason()
        {
            if (useCudnn())
                return "";

            return "The engine setting is set on CAFFE or DEFAULT.";
        }

        /// <summary>
        /// Specifies to use cuDnn RNN8 if supported (requires cuDnn 8.0 or higher), (default = false).
        /// </summary>
        [Description("Specifies to use cuDnn RNN8 if supported (requires cuDnn 8.0 or higher), (default = false).")]
        public bool use_cudnn_rnn8_if_supported
        {
            get { return m_bUseCudnnRnn8IfSupported; }
            set { m_bUseCudnnRnn8IfSupported = value; }
        }

        /// <summary>
        /// Auto repeat the hidden and cell states so that a separate state is fed to each layer.
        /// </summary>
        [Description("Auto repeat the hidden and cell states so that a separate state is fed to each layer.")]
        public bool auto_repeat_hidden_states_across_layers
        {
            get { return m_bAutoRepeatHiddenStatesAcrossLayers; }
            set { m_bAutoRepeatHiddenStatesAcrossLayers = value; }
        }

        /// <summary>
        /// The input and outputs are shaped with the batch in the first dimension.
        /// </summary>
        [Description("The input and outputs are shaped with the batch in the first dimension.")]
        public bool batch_first
        {
            get { return m_bBatchFirst; }
            set { m_bBatchFirst = value; }
        }

        /// <summary>
        /// Queries whether or not to use NVIDIA's cuDnn.
        /// </summary>
        /// <returns>Returns <i>false</i> when the engine is CAFFE or DEFAULT, otherwise <i>true</i>.</returns>
        public bool useCudnn()
        {
            return (engine != Engine.CAFFE && engine != Engine.DEFAULT);
        }

        /// <summary>
        /// Specifies whether the network is bidirectional (<i>true</i>) or unidirectional (<i>false</i> - default).
        /// </summary>
        [Description("Specifies whether the network is bidirectional (<i>true</i>) or unidirectional (<i>false</i> - default).")]
        public bool bidirectional
        {
            get { return m_bBidirectional; }
            set { m_bBidirectional = value; }
        }

        /// <summary>
        /// The dimension of the output (and usually hidden state) representation -- must be explicitly set to non-zero.
        /// </summary>
        [Description("Specifies the dimension of the output (and usually hidden state) representation -- must be explicitly set to non-zero.")]
        public uint num_output
        {
            get { return m_nNumOutput; }
            set { m_nNumOutput = value; }
        }

        /// <summary>
        /// The filler for the weights.
        /// </summary>
        [Description("Specifies the filler for the weights.")]
        public FillerParameter weight_filler
        {
            get { return m_weight_filler; }
            set { m_weight_filler = value; }
        }

        /// <summary>
        /// The filler for the bias.
        /// </summary>
        [Description("Specifies the filler for the bias.")]
        public FillerParameter bias_filler
        {
            get { return m_bias_filler; }
            set { m_bias_filler = value; }
        }

        /// <summary>
        /// Whether to enable displaying debug info in the unrolled recurrent net.
        /// </summary>
        [Description("Specifies whether to enable displaying debug info in the unrolled recurrent net.")]
        public bool debug_info
        {
            get { return m_bDebugInfo; }
            set { m_bDebugInfo = value; }
        }

        /// <summary>
        /// Whether to add as additional inputs (bottoms) the initial hidden state blobs.
        /// The number of additional bottom/top blobs required depends on the recurrent
        /// architecture -- e.g., 1 for RNN's, 2 for LSTM's.
        /// </summary>
        [Description("Specifies whether to add as additional inputs (bottoms) the initial hidden state blobs.  The number of additional bottom/top blobs required depends on the recurrent architecture -- e.g., 1 for RNN's, 2 for LSTM's.")]
        public bool expose_hidden_input
        {
            get { return m_bExposeHiddenInput; }
            set { m_bExposeHiddenInput = value; }
        }

        /// <summary>
        /// Whether to add as additional outputs (tops) the final timestep hidden state blobs.
        /// The number of additional bottom/top blobs required depends on the recurrent
        /// architecture -- e.g., 1 for RNN's, 2 for LSTM's.
        /// </summary>
        [Description("Specifies whether to add as additional outputs (tops) the final timestep hidden state blobs.  The number of additional bottom/top blobs required depends on the recurrent architecture -- e.g., 1 for RNN's, 2 for LSTM's.")]
        public bool expose_hidden_output
        {
            get { return m_bExposeHiddenOutput; }
            set { m_bExposeHiddenOutput = value; }
        }

        /// <summary>
        /// The number of LSTM layers to implement (cuDnn only).
        /// </summary>
        [Description("Specifies the number of LSTM layers to implement (cuDnn only).")]
        public uint num_layers
        {
            get { return m_nNumLayers; }
            set { m_nNumLayers = value; }
        }

        /// <summary>
        /// Specifies the dropout ratio (cuDnn only), e.g. the probability that values will be
        /// dropped out and set to zero.  A value of 0.25 = 25% chance that a value is set to 0.
        /// </summary>
        [Description("Specifies the dropout ratio (cuDnn only). (e.g. the probability that values will be dropped out and set to zero.  A value of 0.25 = 25% chance that a value is set to 0, and dropped out.)")]
        public double dropout_ratio
        {
            get { return m_dfDropoutRatio; }
            set { m_dfDropoutRatio = value; }
        }

        /// <summary>
        /// Specifies the seed used by cuDnn for random number generation (cuDnn only).
        /// The default value of '0' uses a random seed.
        /// </summary>
        [Description("Specifies the random number generator seed used with the cuDnn dropout - the default value of '0' uses a random seed (cuDnn only).")]
        public long dropout_seed
        {
            get { return m_lDropoutSeed; }
            set { m_lDropoutSeed = value; }
        }

        /// <summary>
        /// Specifies to enable the CUDA tensor cores when performing the rnn operations, which is
        /// faster but not supported by all GPU's.  When not supported, the default math is used.
        /// </summary>
        [Description("Specifies to enable CUDA tensor cores when performing the rnn operations which is faster but not supported by all GPU's.  When not supported, the default math is used.")]
        public bool cudnn_enable_tensor_cores
        {
            get { return m_bCudnnEnableTensorCores; }
            set { m_bCudnnEnableTensorCores = value; }
        }

        /// <summary>
        /// Load the parameter from a binary reader.
        /// </summary>
        /// <param name="br">Specifies the binary reader; a single string holding the prototxt is read from it.</param>
        /// <param name="bNewInstance">When <i>false</i>, the loaded values are also copied into this instance.</param>
        /// <returns>Returns the newly parsed RecurrentParameter (in both cases).</returns>
        public override object Load(BinaryReader br, bool bNewInstance = true)
        {
            RawProto proto = RawProto.Parse(br.ReadString());
            RecurrentParameter p = FromProto(proto);

            if (!bNewInstance)
                Copy(p);

            return p;
        }

        /// <summary>
        /// Creates a new copy of this instance of the parameter.
        /// </summary>
        /// <returns>A new RecurrentParameter populated from this instance is returned.</returns>
        public override LayerParameterBase Clone()
        {
            RecurrentParameter p = new RecurrentParameter();
            p.Copy(this);
            return p;
        }

        /// <summary>
        /// Copy one parameter to another.
        /// </summary>
        /// <remarks>
        /// The base (engine) settings are always copied; the recurrent specific settings are
        /// only copied when <i>src</i> is a RecurrentParameter.
        /// </remarks>
        /// <param name="src">Specifies the parameter to copy.</param>
        public override void Copy(LayerParameterBase src)
        {
            base.Copy(src);

            RecurrentParameter p = src as RecurrentParameter;
            if (p == null)
                return;

            m_nNumOutput = p.num_output;

            // The fillers are optional (ToProto also treats them as nullable), so guard
            // the clone to avoid a NullReferenceException when a filler is not set.
            m_weight_filler = (p.weight_filler != null) ? p.weight_filler.Clone() : null;
            m_bias_filler = (p.bias_filler != null) ? p.bias_filler.Clone() : null;

            m_bDebugInfo = p.debug_info;
            m_bExposeHiddenInput = p.expose_hidden_input;
            m_bExposeHiddenOutput = p.expose_hidden_output;
            m_dfDropoutRatio = p.dropout_ratio;
            m_lDropoutSeed = p.dropout_seed;
            m_nNumLayers = p.num_layers;
            m_bBidirectional = p.bidirectional;
            m_bCudnnEnableTensorCores = p.cudnn_enable_tensor_cores;
            m_bBatchFirst = p.batch_first;
            m_bAutoRepeatHiddenStatesAcrossLayers = p.auto_repeat_hidden_states_across_layers;
            m_bUseCudnnRnn8IfSupported = p.use_cudnn_rnn8_if_supported;
        }

        /// <summary>
        /// Convert the parameter into a RawProto.
        /// </summary>
        /// <param name="strName">Specifies the name to associate with the RawProto.</param>
        /// <returns>The new RawProto is returned.</returns>
        public override RawProto ToProto(string strName)
        {
            RawProto rpBase = base.ToProto("engine");
            RawProtoCollection rgChildren = new RawProtoCollection();

            // Start with the children produced by the base (engine) parameter.
            rgChildren.Add(rpBase.Children);
            rgChildren.Add("num_output", num_output.ToString());

            if (weight_filler != null)
                rgChildren.Add(weight_filler.ToProto("weight_filler"));

            if (bias_filler != null)
                rgChildren.Add(bias_filler.ToProto("bias_filler"));

            rgChildren.Add("debug_info", debug_info.ToString());
            // 'expose_hidden' is written as the combination of both flags; the individual
            // flags follow and take precedence when parsed by FromProto.
            rgChildren.Add("expose_hidden", (expose_hidden_input && expose_hidden_output).ToString());
            rgChildren.Add("expose_hidden_input", expose_hidden_input.ToString());
            rgChildren.Add("expose_hidden_output", expose_hidden_output.ToString());
            rgChildren.Add("batch_first", batch_first.ToString());
            rgChildren.Add("auto_repeat_hidden_states_across_layers", auto_repeat_hidden_states_across_layers.ToString());
            rgChildren.Add("use_cudnn_rnn8_if_supported", use_cudnn_rnn8_if_supported.ToString());

            // These settings are only written when the engine is not explicitly CAFFE.
            if (engine != Engine.CAFFE)
            {
                // NOTE(review): ToString() here formats with the current culture - confirm that
                // ParseDouble round-trips the value when the decimal separator is not '.'.
                rgChildren.Add("dropout_ratio", dropout_ratio.ToString());
                rgChildren.Add("dropout_seed", dropout_seed.ToString());
                rgChildren.Add("num_layers", num_layers.ToString());
                rgChildren.Add("bidirectional", bidirectional.ToString());
            }

            rgChildren.Add("cudnn_enable_tensor_cores", cudnn_enable_tensor_cores.ToString());

            return new RawProto(strName, "", rgChildren);
        }

        /// <summary>
        /// Parses the parameter from a RawProto.
        /// </summary>
        /// <remarks>
        /// Values that are not found in the RawProto keep their default values.
        /// </remarks>
        /// <param name="rp">Specifies the RawProto to parse.</param>
        /// <returns>A new instance of the parameter is returned.</returns>
        public static new RecurrentParameter FromProto(RawProto rp)
        {
            string strVal;
            RecurrentParameter p = new RecurrentParameter();

            // The source is a plain EngineParameter, so only the base settings are copied here.
            ((EngineParameter)p).Copy(EngineParameter.FromProto(rp));

            if ((strVal = rp.FindValue("num_output")) != null)
                p.num_output = uint.Parse(strVal);

            RawProto rpWeightFiller = rp.FindChild("weight_filler");
            if (rpWeightFiller != null)
                p.weight_filler = FillerParameter.FromProto(rpWeightFiller);

            RawProto rpBiasFiller = rp.FindChild("bias_filler");
            if (rpBiasFiller != null)
                p.bias_filler = FillerParameter.FromProto(rpBiasFiller);

            if ((strVal = rp.FindValue("debug_info")) != null)
                p.debug_info = bool.Parse(strVal);

            // The combined 'expose_hidden' setting applies to both the input and output flags;
            // the individual settings parsed next override it when present.
            if ((strVal = rp.FindValue("expose_hidden")) != null)
            {
                bool bExposeHidden = bool.Parse(strVal);
                p.expose_hidden_input = bExposeHidden;
                p.expose_hidden_output = bExposeHidden;
            }

            if ((strVal = rp.FindValue("expose_hidden_input")) != null)
                p.expose_hidden_input = bool.Parse(strVal);

            if ((strVal = rp.FindValue("expose_hidden_output")) != null)
                p.expose_hidden_output = bool.Parse(strVal);

            if ((strVal = rp.FindValue("dropout_ratio")) != null)
                p.dropout_ratio = ParseDouble(strVal);

            if ((strVal = rp.FindValue("dropout_seed")) != null)
                p.dropout_seed = long.Parse(strVal);

            if ((strVal = rp.FindValue("num_layers")) != null)
                p.num_layers = uint.Parse(strVal);

            if ((strVal = rp.FindValue("bidirectional")) != null)
                p.bidirectional = bool.Parse(strVal);

            if ((strVal = rp.FindValue("cudnn_enable_tensor_cores")) != null)
                p.cudnn_enable_tensor_cores = bool.Parse(strVal);

            if ((strVal = rp.FindValue("batch_first")) != null)
                p.batch_first = bool.Parse(strVal);

            if ((strVal = rp.FindValue("auto_repeat_hidden_states_across_layers")) != null)
                p.auto_repeat_hidden_states_across_layers = bool.Parse(strVal);

            if ((strVal = rp.FindValue("use_cudnn_rnn8_if_supported")) != null)
                p.use_cudnn_rnn8_if_supported = bool.Parse(strVal);

            return p;
        }
    }

}

MyCaffe.basecode.BaseParameter.ParseDouble
static double ParseDouble(string strVal)
Parse double values using the US culture if the decimal separator = '.', then using the native cultur...
Definition: BaseParameter.cs:35

MyCaffe.basecode.RawProtoCollection
The RawProtoCollection class is a list of RawProto objects.
Definition: RawProtoCollection.cs:12

MyCaffe.basecode.RawProtoCollection.Add
void Add(RawProto p)
Adds a RawProto to the collection.
Definition: RawProtoCollection.cs:55

MyCaffe.basecode.RawProto
The RawProto class is used to parse and output Google prototxt file data.
Definition: RawProto.cs:17

MyCaffe.basecode.RawProto.Children
RawProtoCollection Children
Returns a collection of this node's child nodes.
Definition: RawProto.cs:96

MyCaffe.basecode.RawProto.FindChild
RawProto FindChild(string strName)
Searches for a given node.
Definition: RawProto.cs:231

MyCaffe.basecode.RawProto.Parse
static RawProto Parse(string str)
Parses a prototxt and places it in a new RawProto.
Definition: RawProto.cs:306

MyCaffe.basecode.RawProto.FindValue
string FindValue(string strName)
Searches for a value of a node within this node's children.
Definition: RawProto.cs:105

MyCaffe.param.EngineParameter
Specifies whether to use the NVIDIA cuDnn version or Caffe version of a given forward/backward operat...
Definition: EngineParameter.cs:17

MyCaffe.param.EngineParameter.engine
Engine engine
Specifies the Engine in use.
Definition: EngineParameter.cs:49

MyCaffe.param.EngineParameter.EngineParameter
EngineParameter()
Constructor for the parameter.
Definition: EngineParameter.cs:40

MyCaffe.param.EngineParameter.FromProto
static EngineParameter FromProto(RawProto rp)
Parses the parameter from a RawProto.
Definition: EngineParameter.cs:102

MyCaffe.param.EngineParameter.Engine
Engine
Defines the type of engine to use.
Definition: EngineParameter.cs:24

MyCaffe.param.FillerParameter
Specifies the filler parameters used to create each Filler.
Definition: FillerParameter.cs:16

MyCaffe.param.FillerParameter.FromProto
static FillerParameter FromProto(RawProto rp)
Parses the parameter from a RawProto.
Definition: FillerParameter.cs:350

MyCaffe.param.FillerParameter.ToProto
override RawProto ToProto(string strName)
Convert the parameter into a RawProto.
Definition: FillerParameter.cs:314

MyCaffe.param.FillerParameter.Clone
FillerParameter Clone()
Creates a new copy of this instance of the parameter.
Definition: FillerParameter.cs:293

MyCaffe.param.LayerParameterBase
The LayerParameterBase is the base class for all other layer specific parameters.
Definition: LayerParameterBase.cs:18

MyCaffe.param.RecurrentParameter
Specifies the parameters used by the RecurrentLayer.
Definition: RecurrentParameter.cs:18

MyCaffe.param.RecurrentParameter.Copy
override void Copy(LayerParameterBase src)
Copy one parameter to another.
Definition: RecurrentParameter.cs:237

MyCaffe.param.RecurrentParameter.FromProto
static new RecurrentParameter FromProto(RawProto rp)
Parses the parameter from a RawProto.
Definition: RecurrentParameter.cs:306

MyCaffe.param.RecurrentParameter.use_cudnn_rnn8_if_supported
bool use_cudnn_rnn8_if_supported
Specifies to use cuDnn RNN8 if supported (requires cuDnn 8.0 or higher), (default = false).
Definition: RecurrentParameter.cs:55

MyCaffe.param.RecurrentParameter.debug_info
bool debug_info
Whether to enable displaying debug info in the unrolled recurrent net.
Definition: RecurrentParameter.cs:141

MyCaffe.param.RecurrentParameter.num_layers
uint num_layers
The number of LSTM layers to implement.
Definition: RecurrentParameter.cs:176

MyCaffe.param.RecurrentParameter.num_output
uint num_output
The dimension of the output (and usually hidden state) representation – must be explicitly set to non...
Definition: RecurrentParameter.cs:111

MyCaffe.param.RecurrentParameter.weight_filler
FillerParameter weight_filler
The filler for the weights.
Definition: RecurrentParameter.cs:121

MyCaffe.param.RecurrentParameter.expose_hidden_output
bool expose_hidden_output
Whether to add as additional outputs (tops) the final timestep hidden state blobs....
Definition: RecurrentParameter.cs:165

MyCaffe.param.RecurrentParameter.bidirectional
bool bidirectional
Specifies whether the network is bidirectional (true) or unidirectional (false - default).
Definition: RecurrentParameter.cs:100

MyCaffe.param.RecurrentParameter.batch_first
bool batch_first
The input and outputs are shaped with the batch in the first dimension.
Definition: RecurrentParameter.cs:75

MyCaffe.param.RecurrentParameter.dropout_seed
long dropout_seed
Specifies the seed used by cuDnn for random number generation.
Definition: RecurrentParameter.cs:198

MyCaffe.param.RecurrentParameter.useCudnn
bool useCudnn()
Queries whether or not to use NVIDIA's cuDnn.
Definition: RecurrentParameter.cs:87

MyCaffe.param.RecurrentParameter.RecurrentParameter
RecurrentParameter()
Constructor for the parameter.
Definition: RecurrentParameter.cs:35

MyCaffe.param.RecurrentParameter.dropout_ratio
double dropout_ratio
Specifies the dropout ratio. (e.g. the probability that values will be dropped out and set to zero....
Definition: RecurrentParameter.cs:187

MyCaffe.param.RecurrentParameter.bias_filler
FillerParameter bias_filler
The filler for the bias.
Definition: RecurrentParameter.cs:131

MyCaffe.param.RecurrentParameter.Load
override object Load(BinaryReader br, bool bNewInstance=true)
Load the parameter from a binary reader.
Definition: RecurrentParameter.cs:217

MyCaffe.param.RecurrentParameter.ToProto
override RawProto ToProto(string strName)
Convert the parameter into a RawProto.
Definition: RecurrentParameter.cs:266

MyCaffe.param.RecurrentParameter.cudnn_enable_tensor_cores
bool cudnn_enable_tensor_cores
Specifies to enable the CUDA tensor cores when performing the rnn operations which is faster but not ...
Definition: RecurrentParameter.cs:211

MyCaffe.param.RecurrentParameter.auto_repeat_hidden_states_across_layers
bool auto_repeat_hidden_states_across_layers
Auto repeat the hidden and cell states so that a separate state is fed to each layer.
Definition: RecurrentParameter.cs:65

MyCaffe.param.RecurrentParameter.Clone
override LayerParameterBase Clone()
Creates a new copy of this instance of the parameter.
Definition: RecurrentParameter.cs:229

MyCaffe.param.RecurrentParameter.useCaffeReason
string useCaffeReason()
Returns the reason that Caffe version was used instead of NVIDIA's cuDnn.
Definition: RecurrentParameter.cs:43

MyCaffe.param.RecurrentParameter.expose_hidden_input
bool expose_hidden_input
Whether to add as additional inputs (bottoms) the initial hidden state blobs. The number of addition...
Definition: RecurrentParameter.cs:153

MyCaffe.basecode
The MyCaffe.basecode contains all generic types used throughout MyCaffe.
Definition: Annotation.cs:12

MyCaffe.param
The MyCaffe.param namespace contains parameters used to create models.
Definition: AttentionParameter.cs:9

MyCaffe
The MyCaffe namespace contains the main body of MyCaffe code that closely tracks the C++ Caffe open-...
Definition: Annotation.cs:12

System.ComponentModel
Definition: Component.cs:11

System
Definition: Component.cs:11