mycaffe/html/_causal_self_attention_parameter_8cs_source.html

using System;

using System.Collections.Generic;

using System.Linq;

using System.Text;

using System.ComponentModel;

using MyCaffe.basecode;


namespace MyCaffe.param.gpt

{

    /// <summary>
    /// Specifies the parameters for the CausalSelfAttentionLayer.
    /// </summary>
    /// <remarks>
    /// All numeric values are written to and read from the RawProto using the invariant culture
    /// so that the text produced by <see cref="ToProto"/> does not depend on the regional
    /// settings of the machine (e.g. '0.1' is never written as '0,1').
    /// </remarks>
    [Serializable]
    [TypeConverter(typeof(ExpandableObjectConverter))]
    public class CausalSelfAttentionParameter : LayerParameterBase
    {
        uint m_nHeads = 6;
        uint m_nEmbed = 192;
        double m_dfAttnDropout;     // no initializer: defaults to 0.
        double m_dfResidDropout;    // no initializer: defaults to 0.
        uint m_nBlockSize = 128;
        uint m_nLayers = 6;

        /// <summary>
        /// Constructor for the parameter.
        /// </summary>
        public CausalSelfAttentionParameter()
        {
        }

        /// <summary>
        /// The number of layers (transformer blocks) used (default = 6).
        /// </summary>
        [Description("Specifies number of layers (transformer blocks) used.")]
        public uint layers
        {
            get { return m_nLayers; }
            set { m_nLayers = value; }
        }

        /// <summary>
        /// The number of heads used (default = 6).
        /// </summary>
        [Description("Specifies number of heads used.")]
        public uint heads
        {
            get { return m_nHeads; }
            set { m_nHeads = value; }
        }

        /// <summary>
        /// Specifies size of the embed (default = 192).
        /// </summary>
        [Description("Specifies size of the embed.")]
        public uint embed
        {
            get { return m_nEmbed; }
            set { m_nEmbed = value; }
        }

        /// <summary>
        /// Specifies size of the block (default = 128).
        /// </summary>
        [Description("Specifies size of the block.")]
        public uint block_size
        {
            get { return m_nBlockSize; }
            set { m_nBlockSize = value; }
        }

        /// <summary>
        /// Specifies dropout probability used on the attention weights (default = 0).
        /// </summary>
        [Description("Specifies dropout probability used on the attention weights.")]
        public double attn_dropout
        {
            get { return m_dfAttnDropout; }
            set { m_dfAttnDropout = value; }
        }

        /// <summary>
        /// Specifies dropout probability used on the residual weights (default = 0).
        /// </summary>
        [Description("Specifies dropout probability used on the residual weights.")]
        public double resid_dropout
        {
            get { return m_dfResidDropout; }
            set { m_dfResidDropout = value; }
        }

        /// <summary>
        /// Load the parameter from a binary reader.
        /// </summary>
        /// <param name="br">Specifies the binary reader; a single string is read from it and handed to RawProto.Parse.</param>
        /// <param name="bNewInstance">When <i>false</i>, the parsed values are also copied into this instance.</param>
        /// <returns>The newly parsed parameter instance is returned (regardless of <i>bNewInstance</i>).</returns>
        public override object Load(System.IO.BinaryReader br, bool bNewInstance = true)
        {
            RawProto proto = RawProto.Parse(br.ReadString());
            CausalSelfAttentionParameter p = FromProto(proto);

            if (!bNewInstance)
            {
                Copy(p);
            }

            // NOTE: the parsed instance (not 'this') is returned in both cases; kept as-is for existing callers.
            return p;
        }

        /// <summary>
        /// Copy one parameter to another.
        /// </summary>
        /// <param name="src">Specifies the parameter to copy; must be a CausalSelfAttentionParameter.</param>
        public override void Copy(LayerParameterBase src)
        {
            CausalSelfAttentionParameter p = (CausalSelfAttentionParameter)src;

            m_nLayers = p.layers;
            m_nHeads = p.heads;
            m_nEmbed = p.embed;
            m_nBlockSize = p.block_size;
            m_dfAttnDropout = p.attn_dropout;
            m_dfResidDropout = p.resid_dropout;
        }

        /// <summary>
        /// Creates a new copy of this instance of the parameter.
        /// </summary>
        /// <returns>A new CausalSelfAttentionParameter holding the same values is returned.</returns>
        public override LayerParameterBase Clone()
        {
            CausalSelfAttentionParameter p = new CausalSelfAttentionParameter();
            p.Copy(this);
            return p;
        }

        /// <summary>
        /// Convert the parameter into a RawProto.
        /// </summary>
        /// <param name="strName">Specifies the name to associate with the RawProto.</param>
        /// <returns>The new RawProto, with one child per property, is returned.</returns>
        public override RawProto ToProto(string strName)
        {
            // Format with the invariant culture so that the decimal separator is always '.'.
            System.Globalization.CultureInfo invariant = System.Globalization.CultureInfo.InvariantCulture;
            RawProtoCollection rgChildren = new RawProtoCollection();

            rgChildren.Add("layers", layers.ToString(invariant));
            rgChildren.Add("heads", heads.ToString(invariant));
            rgChildren.Add("embed", embed.ToString(invariant));
            rgChildren.Add("block_size", block_size.ToString(invariant));
            rgChildren.Add("attn_dropout", attn_dropout.ToString(invariant));
            rgChildren.Add("resid_dropout", resid_dropout.ToString(invariant));

            return new RawProto(strName, "", rgChildren);
        }

        /// <summary>
        /// Parses the parameter from a RawProto.
        /// </summary>
        /// <param name="rp">Specifies the RawProto to parse.</param>
        /// <returns>A new instance of the parameter is returned; values not found in <i>rp</i> keep their defaults.</returns>
        public static CausalSelfAttentionParameter FromProto(RawProto rp)
        {
            // Parse with the invariant culture to match the format written by ToProto.
            System.Globalization.CultureInfo invariant = System.Globalization.CultureInfo.InvariantCulture;
            string strVal;
            CausalSelfAttentionParameter p = new CausalSelfAttentionParameter();

            if ((strVal = rp.FindValue("layers")) != null)
            {
                p.layers = uint.Parse(strVal, invariant);
            }

            if ((strVal = rp.FindValue("heads")) != null)
            {
                p.heads = uint.Parse(strVal, invariant);
            }

            if ((strVal = rp.FindValue("embed")) != null)
            {
                p.embed = uint.Parse(strVal, invariant);
            }

            if ((strVal = rp.FindValue("block_size")) != null)
            {
                p.block_size = uint.Parse(strVal, invariant);
            }

            if ((strVal = rp.FindValue("attn_dropout")) != null)
            {
                p.attn_dropout = double.Parse(strVal, invariant);
            }

            if ((strVal = rp.FindValue("resid_dropout")) != null)
            {
                p.resid_dropout = double.Parse(strVal, invariant);
            }

            return p;
        }
    }

}

MyCaffe.basecode.RawProtoCollection
The RawProtoCollection class is a list of RawProto objects.
Definition: RawProtoCollection.cs:12

MyCaffe.basecode.RawProtoCollection.Add
void Add(RawProto p)
Adds a RawProto to the collection.
Definition: RawProtoCollection.cs:55

MyCaffe.basecode.RawProto
The RawProto class is used to parse and output Google prototxt file data.
Definition: RawProto.cs:17

MyCaffe.basecode.RawProto.Parse
static RawProto Parse(string str)
Parses a prototxt and places it in a new RawProto.
Definition: RawProto.cs:306

MyCaffe.basecode.RawProto.FindValue
string FindValue(string strName)
Searches for a value of a node within this node's children.
Definition: RawProto.cs:105

MyCaffe.param.LayerParameterBase
The LayerParameterBase is the base class for all other layer specific parameters.
Definition: LayerParameterBase.cs:18

MyCaffe.param.gpt.CausalSelfAttentionParameter
Specifies the parameters for the CausalSelfAttentionLayer.
Definition: CausalSelfAttentionParameter.cs:16

MyCaffe.param.gpt.CausalSelfAttentionParameter.ToProto
override RawProto ToProto(string strName)
Convert the parameter into a RawProto.
Definition: CausalSelfAttentionParameter.cs:123

MyCaffe.param.gpt.CausalSelfAttentionParameter.embed
uint embed
Specifies size of the embed.
Definition: CausalSelfAttentionParameter.cs:53

MyCaffe.param.gpt.CausalSelfAttentionParameter.FromProto
static CausalSelfAttentionParameter FromProto(RawProto rp)
Parses the parameter from a RawProto.
Definition: CausalSelfAttentionParameter.cs:142

MyCaffe.param.gpt.CausalSelfAttentionParameter.Copy
override void Copy(LayerParameterBase src)
Copy one parameter to another.
Definition: CausalSelfAttentionParameter.cs:98

MyCaffe.param.gpt.CausalSelfAttentionParameter.Load
override object Load(System.IO.BinaryReader br, bool bNewInstance=true)
Load the parameter from a binary reader.
Definition: CausalSelfAttentionParameter.cs:86

MyCaffe.param.gpt.CausalSelfAttentionParameter.heads
uint heads
The number of heads used.
Definition: CausalSelfAttentionParameter.cs:44

MyCaffe.param.gpt.CausalSelfAttentionParameter.block_size
uint block_size
Specifies size of the block.
Definition: CausalSelfAttentionParameter.cs:62

MyCaffe.param.gpt.CausalSelfAttentionParameter.resid_dropout
double resid_dropout
Specifies dropout probability used on the residual weights.
Definition: CausalSelfAttentionParameter.cs:80

MyCaffe.param.gpt.CausalSelfAttentionParameter.Clone
override LayerParameterBase Clone()
Creates a new copy of this instance of the parameter.
Definition: CausalSelfAttentionParameter.cs:111

MyCaffe.param.gpt.CausalSelfAttentionParameter.layers
uint layers
The number of layers (transformer blocks) used.
Definition: CausalSelfAttentionParameter.cs:34

MyCaffe.param.gpt.CausalSelfAttentionParameter.attn_dropout
double attn_dropout
Specifies dropout probability used on the attention weights.
Definition: CausalSelfAttentionParameter.cs:71

MyCaffe.param.gpt.CausalSelfAttentionParameter.CausalSelfAttentionParameter
CausalSelfAttentionParameter()
Constructor for the parameter.
Definition: CausalSelfAttentionParameter.cs:25

MyCaffe.basecode
The MyCaffe.basecode contains all generic types used throughout MyCaffe.
Definition: Annotation.cs:12

MyCaffe.param.gpt
Definition: CausalSelfAttentionParameter.cs:9

MyCaffe
The MyCaffe namespace contains the main body of MyCaffe code that closely tracks the C++ Caffe open-...
Definition: Annotation.cs:12

System.ComponentModel
Definition: Component.cs:11

System
Definition: Component.cs:11