2using System.Collections.Generic;
29 bool m_bWarningShown =
false;
56 m_blobBiasMultiplier =
new common.
Blob<T>(cuda, log);
60 m_blobWork =
new common.
Blob<T>(cuda, log);
69 if (m_blobBiasMultiplier !=
null)
72 m_blobBiasMultiplier =
null;
76 if (m_blobWork !=
null)
92 col.
Add(m_blobBiasMultiplier);
129 base.ReInitializeParameters(target);
153 m_bWarningShown =
false;
155 if (colBottom.
Count > 1)
159 m_log.
CHECK_GT(m_nN, 0,
"EmbedLayer num_output must be positive.");
162 m_log.
CHECK_GT(m_nK, 0,
"EmbedLayer input_dim must be positive.");
176 List<int> rgWeightShape =
new List<int>() { m_nK, m_nN };
183 blobWeight.
Reshape(rgWeightShape);
187 weight_filler.
Fill(blobWeight);
195 List<int> rgBiasShape =
new List<int>() { m_nN };
204 bias_filler.
Fill(blobBias);
221 m_nM = colBottom[0].count();
222 List<int> rgTopShape =
Utility.Clone<
int>(colBottom[0].shape());
224 rgTopShape.Add(m_nN);
230 List<int> rgBiasShape =
new List<int>() { m_nM };
232 m_blobBiasMultiplier.
Reshape(rgBiasShape);
233 m_blobBiasMultiplier.
SetData(1.0);
244 long hBottomData = colBottom[0].gpu_data;
245 long hTopData = colTop[0].mutable_gpu_data;
247 int nCount = colTop[0].count();
250 Tuple<double, double, double, double> minmax = colBottom[0].minmax_data(m_blobWork,
true);
251 double dfMin = minmax.Item1;
252 double dfMax = minmax.Item2;
253 if (dfMin < 0 || dfMax >= m_nK)
254 throw new Exception(
"A data element within '" + colBottom[0].Name +
"' is out of range [0," + m_nK.ToString() +
") non inclusive. Data Min = " + dfMin.ToString() +
" Max = " + dfMax.ToString() +
".");
257 m_cuda.embed_fwd(nCount, hBottomData, hWeight, m_nM, m_nN, m_nK, hTopData);
260 m_cuda.gemm(
false,
false, m_nM, m_nN, 1, 1.0, m_blobBiasMultiplier.
gpu_data,
m_colBlobs[1].gpu_data, 1.0, hTopData);
271 if (rgbPropagateDown[0] && !m_bWarningShown)
273 m_log.
WriteLine(
"WARNING: Can't backpropagate to EmbedLayer input.");
274 m_bWarningShown =
true;
279 int nTopCount = colTop[0].count();
280 long hTopDiff = colTop[0].gpu_diff;
281 long hBottomData = colBottom[0].gpu_data;
282 long hWeightDiff =
m_colBlobs[0].mutable_gpu_diff;
283 m_cuda.embed_bwd(nTopCount, hBottomData, hTopDiff, m_nM, m_nN, m_nK, hWeightDiff);
288 long hTopDiff = colTop[0].gpu_diff;
289 long hBiasDiff =
m_colBlobs[1].mutable_gpu_diff;
290 m_cuda.gemv(
true, m_nM, m_nN, 1.0, hTopDiff, m_blobBiasMultiplier.
gpu_data, 1.0, hBiasDiff);
The Log class provides general output in text form.
void WriteLine(string str, bool bOverrideEnabled=false, bool bHeader=false, bool bError=false, bool bDisable=false)
Write a line of output.
void CHECK_GT(double df1, double df2, string str)
Test whether one number is greater than another.
The Utility class provides general utility functions.
The BlobCollection contains a list of Blobs.
void Add(Blob< T > b)
Add a new Blob to the collection.
int Count
Returns the number of items in the collection.
void Reshape(int[] rgShape)
Reshapes all blobs in the collection to the given shape.
The Blob is the main holder of data that moves through the Layers of the Net.
void SetData(T[] rgData, int nCount=-1, bool bSetCount=true)
Sets a number of items within the Blob's data.
Blob(CudaDnn< T > cuda, Log log, bool bIncludeDiff=true, bool bUseHalfSize=false)
The Blob constructor.
void Reshape(int nNum, int nChannels, int nHeight, int nWidth, bool? bUseHalfSize=null)
DEPRECATED; use
BLOB_TYPE type
Returns the BLOB_TYPE of the Blob.
string Name
Get/set the name of the Blob.
virtual void Dispose(bool bDisposing)
Releases all resources used by the Blob (including both GPU and Host).
long gpu_data
Returns the data GPU handle used by the CudaDnn connection.
The CudaDnn object is the main interface to the Low-Level Cuda C++ DLL.
Abstract Filler class used to fill blobs with values.
void Fill(Blob< T > b)
Fill the blob with values based on the actual filler used.
static Filler< T > Create(CudaDnn< T > cuda, Log log, FillerParameter p)
Create a new Filler instance.
The EmbedLayer is a layer for learning 'embeddings' of one-hot vector input. This layer is initialize...
override void dispose()
Releases all GPU and host resources used by the Layer.
override void forward(BlobCollection< T > colBottom, BlobCollection< T > colTop)
The Forward computation.
override int MaxBottomBlobs
Returns the exact number of required bottom (input) Blobs: input, input_dim.
override void LayerSetUp(BlobCollection< T > colBottom, BlobCollection< T > colTop)
Setup the layer.
override int MinBottomBlobs
Returns the exact number of required bottom (input) Blobs: input.
override void setup_internal_blobs(BlobCollection< T > col)
Derivative layers should add all internal blobs to the 'col' provided.
override void Reshape(BlobCollection< T > colBottom, BlobCollection< T > colTop)
Reshape the bottom (input) and top (output) blobs.
EmbedLayer(CudaDnn< T > cuda, Log log, LayerParameter p)
The EmbedLayer constructor
override int ExactNumTopBlobs
Returns the exact number of required top (output) Blobs: embed
override void backward(BlobCollection< T > colTop, List< bool > rgbPropagateDown, BlobCollection< T > colBottom)
Computes the error gradient w.r.t. the input.
override bool ReInitializeParameters(WEIGHT_TARGET target)
Re-initialize the parameters of the layer.
An interface for the units of computation which can be composed into a Net.
Log m_log
Specifies the Log for output.
LayerParameter m_param
Specifies the LayerParameter describing the Layer.
bool shareLayerBlob(Blob< T > b, List< int > rgMinShape)
Attempts to share a Layer Blob if another parameter Blob with the same name and acceptable size is fo...
bool shareParameter(Blob< T > b, List< int > rgMinShape, bool bAllowEndsWithComparison=false)
Attempts to share a parameter Blob if another parameter Blob with the same name and acceptable size i...
float convertF(T df)
Converts a generic to a float value.
BlobCollection< T > m_colInternalBlobs
Specifies internal blobs used by the layer.
CudaDnn< T > m_cuda
Specifies the CudaDnn connection to Cuda.
LayerParameter.LayerType m_type
Specifies the Layer type.
BlobCollection< T > m_colBlobs
Specifies the learnable parameter Blobs of the Layer.
DictionaryMap< bool > m_rgbParamPropagateDown
Specifies whether or not to compute the learnable diff of each parameter Blob.
uint num_output
Specifies the number of outputs for the layer.
FillerParameter bias_filler
Specifies the filler for the bias.
FillerParameter weight_filler
Specifies the filler for the weights.
uint input_dim
Specifies the input given as integers to be interpreted as one-hot vector indices with dimension num_...
bool bias_term
Specifies whether to use a bias term or not.
Specifies the base parameter for all layers.
string name
Specifies the name of this LayerParameter.
EmbedParameter embed_param
Returns the parameter set when initialized with LayerType.EMBED
LayerType
Specifies the layer type.
The MyCaffe.basecode contains all generic types used throughout MyCaffe.
The MyCaffe.common namespace contains common MyCaffe classes.
BLOB_TYPE
Defines the type of data held by a given Blob.
WEIGHT_TARGET
Defines the type of weight to target in re-initializations.
The MyCaffe.fillers namespace contains all fillers including the Filler class.
The MyCaffe.layers namespace contains all layers that have a solidified code base,...
The MyCaffe.param namespace contains parameters used to create models.
The MyCaffe namespace contains the main body of MyCaffe code that closely tracks the C++ Caffe open-...