using System.Collections.Generic;

// Internal working blob declared as a field.
Blob<T> m_blobFocusedInput = null;

// Parameters for the internal sub-layers (transpose, ipUa, ipWa, add, tanh, ipV).
List<int> rgDimClip = new List<int>() { 1, 0 };
ipUaParam.name = "ipUa";
ipWaParam.name = "ipWa";
addParam.name = "add";
tanhParam.name = "tanh";
ipVParam.name = "ipV";

// Allocate the internal working blobs.
m_blobX = new Blob<T>(cuda, log);
m_blobClip = new Blob<T>(cuda, log);
m_blobX1 = new Blob<T>(cuda, log);
m_blobState = new Blob<T>(cuda, log);
m_blobUh = new Blob<T>(cuda, log);
m_blobWc = new Blob<T>(cuda, log);
m_blobFullWc = new Blob<T>(cuda, log);
m_blobAddOutput = new Blob<T>(cuda, log);
m_blobGG = new Blob<T>(cuda, log);
m_blobAA = new Blob<T>(cuda, log);
m_blobScale = new Blob<T>(cuda, log, false);
m_blobSoftmax = new Blob<T>(cuda, log);
m_blobFocusedInput = new Blob<T>(cuda, log);
m_blobContext = new Blob<T>(cuda, log);
m_blobWork = new Blob<T>(cuda, log);
// dispose(): release the internal blobs.
dispose(ref m_blobFocusedInput);

// setup_internal_blobs(): expose the internal blobs through 'col'.
col.Add(m_blobState);
col.Add(m_blobFullWc);
col.Add(m_blobAddOutput);
col.Add(m_blobScale);
col.Add(m_blobFocusedInput);
col.Add(m_blobContext);

// ReInitializeParameters(): defer to the base implementation.
base.ReInitializeParameters(target);
// addInternal() helpers: rebuild the internal bottom/top collections used to run the sub-layers.
m_colInternalBottom.Clear();
m_colInternalBottom.Add(bottom);
m_colInternalTop.Clear();
m_colInternalTop.Add(top);

// Overload taking a list of bottom blobs.
m_colInternalBottom.Clear();
for (int i = 0; i < rgBottom.Count; i++)
    m_colInternalBottom.Add(rgBottom[i]);
m_colInternalTop.Clear();
m_colInternalTop.Add(top);
// LayerSetUp(): bottom blobs are { input, state, clip }.
Blob<T> blobClip = colBottom[2];

// Permutation for the transpose layers: swap the first two axes, identity on the rest (see the note below).
List<int> rgDimX = new List<int>() { 1, 0 };
while (rgDimX.Count < colBottom[0].num_axes)
    rgDimX.Add(rgDimX.Count);

// Wire and set up the internal sub-layers.
addInternal(blobX, m_blobX);
m_transposeX.Setup(m_colInternalBottom, m_colInternalTop);
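The permutation list follows numpy.transpose semantics (see the TransposeLayer entry below): output axis i takes its size from input axis rgDim[i]. A minimal illustration of the { 1, 0, 2 } case, with hypothetical shape values not taken from the source:

// Hypothetical illustration only: a blob shaped (A, B, C) permuted with { 1, 0, 2 } becomes (B, A, C),
// i.e. the first two axes (e.g. sequence and batch) are swapped while trailing axes are untouched.
List<int> rgShapeIn = new List<int>() { 4, 2, 8 };   // (A=4, B=2, C=8)
List<int> rgDim = new List<int>() { 1, 0, 2 };
List<int> rgShapeOut = new List<int>();
for (int i = 0; i < rgDim.Count; i++)
    rgShapeOut.Add(rgShapeIn[rgDim[i]]);             // yields { 2, 4, 8 }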
addInternal(m_blobX, m_blobUh);
m_ipUa.Setup(m_colInternalBottom, m_colInternalTop);

addInternal(blobClip, m_blobClip);
m_transposeClip.Setup(m_colInternalBottom, m_colInternalTop);

addInternal(m_blobState, m_blobWc);
m_ipWa.Setup(m_colInternalBottom, m_colInternalTop);

addInternal(new List<Blob<T>>() { m_blobUh, m_blobFullWc }, m_blobAddOutput);
m_add1.Setup(m_colInternalBottom, m_colInternalTop);

addInternal(m_blobAddOutput, m_blobGG);
m_tanh.Setup(m_colInternalBottom, m_colInternalTop);

addInternal(m_blobGG, m_blobAA);
m_ipV.Setup(m_colInternalBottom, m_colInternalTop);

// Shape the focused-input, context and top blobs.
List<int> rgFocusShape = Utility.Clone<int>(blobX.shape());
rgFocusShape[0] = blobX.shape(1);
rgFocusShape[1] = blobX.shape(0);
m_blobFocusedInput.Reshape(rgFocusShape);

List<int> rgContextShape = Utility.Clone<int>(blobX.shape());
rgContextShape[0] = rgContextShape[1];
rgContextShape[1] = 1;
m_blobContext.Reshape(rgContextShape);

List<int> rgTopShape = Utility.Clone<int>(m_blobContext.shape());
rgTopShape[0] = m_blobContext.shape(1);
rgTopShape[1] = m_blobContext.shape(0);
// Reshape(): repeat the same wiring so the sub-layers and internal blobs track the bottom shapes.
Blob<T> blobClip = colBottom[2];

addInternal(blobX, m_blobX);
m_transposeX.Reshape(m_colInternalBottom, m_colInternalTop);

addInternal(m_blobX, m_blobUh);
m_ipUa.Reshape(m_colInternalBottom, m_colInternalTop);

addInternal(blobClip, m_blobClip);
m_transposeClip.Reshape(m_colInternalBottom, m_colInternalTop);

addInternal(m_blobState, m_blobWc);
m_ipWa.Reshape(m_colInternalBottom, m_colInternalTop);

addInternal(new List<Blob<T>>() { m_blobUh, m_blobFullWc }, m_blobAddOutput);
m_add1.Reshape(m_colInternalBottom, m_colInternalTop);

addInternal(m_blobAddOutput, m_blobGG);
m_tanh.Reshape(m_colInternalBottom, m_colInternalTop);

addInternal(m_blobGG, m_blobAA);
m_ipV.Reshape(m_colInternalBottom, m_colInternalTop);

List<int> rgFocusShape = Utility.Clone<int>(blobX.shape());
rgFocusShape[0] = blobX.shape(1);
rgFocusShape[1] = blobX.shape(0);
m_blobFocusedInput.Reshape(rgFocusShape);

List<int> rgContextShape = Utility.Clone<int>(blobX.shape());
rgContextShape[0] = rgContextShape[1];
rgContextShape[1] = 1;
m_blobContext.Reshape(rgContextShape);

List<int> rgTopShape = Utility.Clone<int>(m_blobContext.shape());
rgTopShape[0] = m_blobContext.shape(1);
rgTopShape[1] = m_blobContext.shape(0);
// softmax_fwd(): masked, numerically stable softmax over the nChannels axis, built from channel-wise CUDA kernels.
int nCount = blobBottom.count();
int nOuterNum = blobBottom.count(0, nAxis);
int nInnerNum = blobBottom.count(nAxis + 1);
int nChannels = blobTop.shape(nAxis);
long hBottomData = blobBottom.gpu_data;

m_cuda.copy(nCount, hBottomData, hTopData);

// Mask entries beyond nValidValues with a large negative value so they receive ~0 probability.
if (nValidValues < nCount)
    blobTop.SetData(-1000000000.0, nValidValues, nCount - nValidValues);

m_cuda.channel_max(nOuterNum * nInnerNum, nOuterNum, nChannels, nInnerNum, hTopData, hScaleData);
m_cuda.channel_sub(nCount, nOuterNum, nChannels, nInnerNum, hScaleData, hTopData);
m_cuda.exp(nCount, hTopData, hTopData);
m_cuda.channel_sum(nOuterNum * nInnerNum, nOuterNum, nChannels, nInnerNum, hTopData, hScaleData);
m_cuda.channel_div(nCount, nOuterNum, nChannels, nInnerNum, hScaleData, hTopData);
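For reference, a hypothetical CPU sketch of what this channel-wise sequence computes (not part of the layer; it assumes 'using System;' and plain float[] buffers in place of the GPU handles, and SoftmaxFwdCpu is an invented helper name):

// CPU reference of the masked, numerically stable softmax above (illustrative only).
static void SoftmaxFwdCpu(float[] rgBottom, float[] rgTop, int nOuterNum, int nChannels, int nInnerNum, int nValidValues)
{
    Array.Copy(rgBottom, rgTop, rgBottom.Length);

    // Mask entries at or beyond nValidValues so they receive ~0 probability.
    for (int i = nValidValues; i < rgTop.Length; i++)
        rgTop[i] = -1e9f;

    for (int o = 0; o < nOuterNum; o++)
    {
        for (int k = 0; k < nInnerNum; k++)
        {
            // channel_max: find the per-channel maximum for numerical stability.
            float fMax = float.MinValue;
            for (int c = 0; c < nChannels; c++)
                fMax = Math.Max(fMax, rgTop[(o * nChannels + c) * nInnerNum + k]);

            // channel_sub + exp + channel_sum.
            float fSum = 0;
            for (int c = 0; c < nChannels; c++)
            {
                int nIdx = (o * nChannels + c) * nInnerNum + k;
                rgTop[nIdx] = (float)Math.Exp(rgTop[nIdx] - fMax);
                fSum += rgTop[nIdx];
            }

            // channel_div: normalize to probabilities.
            for (int c = 0; c < nChannels; c++)
                rgTop[(o * nChannels + c) * nInnerNum + k] /= fSum;
        }
    }
}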
// softmax_bwd(): standard softmax gradient, re-masked by the clip.
int nOuterNum = blobBottom.count(0, nAxis);
int nInnerNum = blobBottom.count(nAxis + 1);
int nCount = blobTop.count();
int nChannels = blobTop.shape(nAxis);

m_cuda.copy(nCount, hTopDiff, hBottomDiff);
m_cuda.channel_dot(nOuterNum * nInnerNum, nOuterNum, nChannels, nInnerNum, hTopDiff, hTopData, hScaleData);
m_cuda.channel_sub(nCount, nOuterNum, nChannels, nInnerNum, hScaleData, hBottomDiff);
m_cuda.channel_scale(nCount, nOuterNum, nChannels, nInnerNum, hTopData, blobClip.gpu_data, hTopData);
m_cuda.mul(nCount, hBottomDiff, hTopData, hBottomDiff);
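The channel_dot / channel_sub / mul sequence is the usual softmax Jacobian-vector product with the clip mask folded back in. With y the softmax output, it amounts to (a restatement for clarity, not taken from the source):

\[
\frac{\partial L}{\partial x_i} \;=\; \Big(\frac{\partial L}{\partial y_i} \;-\; \sum_j y_j\,\frac{\partial L}{\partial y_j}\Big)\, y_i \,\mathrm{clip}_i
\]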
// Helper: sum a run of diff values on the host.
private float sum_diff(int nCount, Blob<T> b, int nOffset)
for (int i = 0; i < nCount; i++)
    fSum += rg[nOffset + i];

// Helper: fill blob1 (optionally combined with blob2, optionally using diffs) into blobFull.
private void fill(Blob<T> blob1, Blob<T> blob2, Blob<T> blobFull, bool bUseDiff = false, int nBlob1AxisOffset = 0)
int nM = blob1.shape(nAxis + nBlob1AxisOffset);
int nN = blobFull.shape(nAxis);
int nK = blob1.count(nAxis + nBlob1AxisOffset + 1);
List<int> rgShape = new List<int>();
rgShape.Add(blob1.count(0, nAxis));
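Judging from the nM/nN/nK dimensions, fill() appears to tile blob1 across the nN-sized axis of blobFull; in the forward pass it is called as fill(m_blobWc, null, m_blobFullWc), i.e. the Wa-projected state is replicated across every encoder time step before the elementwise add. A rough CPU sketch of that reading (TileCpu is a hypothetical helper; the memory layout is illustrative and the blob2/bUseDiff path is not covered):

// Hypothetical CPU illustration (an interpretation, not the layer's code): replicate each
// nK-length slice of the source across the nN entries of the tiled axis of the destination.
static void TileCpu(float[] rgSrc, float[] rgFull, int nM, int nN, int nK)
{
    for (int m = 0; m < nM; m++)
        for (int n = 0; n < nN; n++)
            for (int k = 0; k < nK; k++)
                rgFull[(m * nN + n) * nK + k] = rgSrc[m * nK + k];
}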
// forward(): transpose the input and clip, project them, score each time step, then apply the masked softmax.
Blob<T> blobClip = colBottom[2];

addInternal(blobX, m_blobX);
m_transposeX.Forward(m_colInternalBottom, m_colInternalTop);

addInternal(blobClip, m_blobClip);
m_transposeClip.Forward(m_colInternalBottom, m_colInternalTop);

// Zero out the input at positions masked by the clip.
apply_clip(m_blobX, blobClip, m_blobX);

addInternal(m_blobX, m_blobUh);
m_ipUa.Forward(m_colInternalBottom, m_colInternalTop);

addInternal(m_blobState, m_blobWc);
m_ipWa.Forward(m_colInternalBottom, m_colInternalTop);

// Broadcast the state projection across the sequence so it can be added per time step.
fill(m_blobWc, null, m_blobFullWc);

addInternal(new List<Blob<T>>() { m_blobUh, m_blobFullWc }, m_blobAddOutput);
m_add1.Forward(m_colInternalBottom, m_colInternalTop);

addInternal(m_blobAddOutput, m_blobGG);
m_tanh.Forward(m_colInternalBottom, m_colInternalTop);

addInternal(m_blobGG, m_blobAA);
m_ipV.Forward(m_colInternalBottom, m_colInternalTop);

softmax_fwd(m_blobAA, m_blobClip, m_blobScale, m_blobSoftmax, 1);

// Copy the (clipped, transposed) input; its weighting by the softmax output happens in code not shown in this excerpt.
m_blobFocusedInput.CopyFrom(m_blobX);
int nCount = m_blobFocusedInput.count(2);
int nOuterNum = m_blobFocusedInput.count(0, 2);
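Taken together, the forward pass is additive (Bahdanau-style) attention. Writing x_t for the transposed, clipped encoder inputs and s for the previous decoder state, the steps above compute, roughly:

\[
u_t = U_a x_t, \qquad w = W_a s, \qquad e_t = v^\top \tanh(u_t + w), \qquad
\alpha = \operatorname{softmax}(e \mid \mathrm{clip}), \qquad c = \sum_t \alpha_t x_t
\]

where U_a, W_a and v are the weights of m_ipUa, m_ipWa and m_ipV, the masked softmax is softmax_fwd, and the weighted sum over the focused input yields m_blobContext, which feeds the top blob.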
// backward(): propagate the top gradient back through the sub-layers in reverse order.
if (rgbPropagateDown[0])

Blob<T> blobClip = colBottom[2];
List<bool> rgbPropagate = new List<bool>() { true, true };

// fill() reused with bUseDiff = true to route the context gradient.
fill(m_blobContext, m_blobSoftmax, m_blobX1, true, 1);

softmax_bwd(m_blobSoftmax, m_blobClip, m_blobScale, m_blobAA, 1);

addInternal(m_blobGG, m_blobAA);
m_ipV.Backward(m_colInternalTop, rgbPropagate, m_colInternalBottom);

addInternal(m_blobAddOutput, m_blobGG);
m_tanh.Backward(m_colInternalTop, rgbPropagate, m_colInternalBottom);

addInternal(new List<Blob<T>>() { m_blobUh, m_blobFullWc }, m_blobAddOutput);
m_add1.Backward(m_colInternalTop, rgbPropagate, m_colInternalBottom);

addInternal(m_blobState, m_blobWc);
m_ipWa.Backward(m_colInternalTop, rgbPropagate, m_colInternalBottom);

addInternal(m_blobX, m_blobUh);
m_ipUa.Backward(m_colInternalTop, rgbPropagate, m_colInternalBottom);

addInternal(blobX, m_blobX);
m_transposeX.Backward(m_colInternalTop, rgbPropagate, m_colInternalBottom);
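For orientation, a minimal usage sketch that constructs and runs the layer directly, based only on the members documented below. The LayerParameter constructor form, the dim value, and the bottom blob shapes are assumptions for illustration; 'cuda' (CudaDnn&lt;float&gt;) and 'log' (Log) are assumed to already exist.

// Illustrative sketch only (not from the source).
LayerParameter p = new LayerParameter(LayerParameter.LayerType.ATTENTION);
p.name = "attn";
p.attention_param.dim = 128;    // assumed value; should match the LSTM output size.

AttentionLayer<float> layer = new AttentionLayer<float>(cuda, log, p);

// Three bottoms (input, state, clip) and one top, per ExactNumBottomBlobs / ExactNumTopBlobs.
Blob<float> blobInput = new Blob<float>(cuda, log);
Blob<float> blobState = new Blob<float>(cuda, log);
Blob<float> blobClip = new Blob<float>(cuda, log);
Blob<float> blobTop = new Blob<float>(cuda, log);
// Reshape the bottom blobs to the shapes expected by the surrounding encoder/decoder model
// before calling Setup (omitted here; the required shapes are not shown in this excerpt).

BlobCollection<float> colBottom = new BlobCollection<float>();
colBottom.Add(blobInput);
colBottom.Add(blobState);
colBottom.Add(blobClip);
BlobCollection<float> colTop = new BlobCollection<float>();
colTop.Add(blobTop);

layer.Setup(colBottom, colTop);     // runs LayerSetUp + Reshape.
layer.Forward(colBottom, colTop);   // colTop[0] now holds the attention context.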
The Log class provides general output in text form.
void CHECK_EQ(double df1, double df2, string str)
Test whether one number is equal to another.
The Utility class provides general utility functions.
The BlobCollection contains a list of Blobs.
void Add(Blob< T > b)
Add a new Blob to the collection.
int Count
Returns the number of items in the collection.
void Clear(bool bDispose=false)
Remove all items from the collection.
void Reshape(int[] rgShape)
Reshapes all blobs in the collection to the given shape.
The Blob is the main holder of data that moves through the Layers of the Net.
int channels
DEPRECATED; legacy shape accessor channels: use shape(1) instead.
void SetData(T[] rgData, int nCount=-1, bool bSetCount=true)
Sets a number of items within the Blob's data.
long mutable_gpu_diff
Returns the diff GPU handle used by the CudaDnn connection.
T[] mutable_cpu_diff
Get diff from the GPU and bring it over to the host, or Set diff from the Host and send it over to th...
long mutable_gpu_data
Returns the data GPU handle used by the CudaDnn connection.
void Reshape(int nNum, int nChannels, int nHeight, int nWidth, bool? bUseHalfSize=null)
DEPRECATED; use
void CopyFrom(Blob< T > src, int nSrcOffset, int nDstOffset, int nCount, bool bCopyData, bool bCopyDiff)
Copy from a source Blob.
List< int > shape()
Returns an array where each element contains the shape of an axis of the Blob.
T asum_data()
Compute the sum of absolute values (L1 norm) of the data.
int count()
Returns the total number of items in the Blob.
void ReshapeLike(Blob< T > b, bool? bUseHalfSize=null)
Reshape this Blob to have the same shape as another Blob.
string Name
Get/set the name of the Blob.
long gpu_diff
Returns the diff GPU handle used by the CudaDnn connection.
void SetDiff(double dfVal, int nIdx=-1)
Either sets all of the diff items in the Blob to a given value, or alternatively only sets a single i...
int num
DEPRECATED; legacy shape accessor num: use shape(0) instead.
long gpu_data
Returns the data GPU handle used by the CudaDnn connection.
The CudaDnn object is the main interface to the Low-Level Cuda C++ DLL.
[DEPRECATED] The AttentionLayer provides focus for LSTM-based encoder/decoder models.
AttentionLayer(CudaDnn< T > cuda, Log log, LayerParameter p)
The AttentionLayer constructor.
override void setup_internal_blobs(BlobCollection< T > col)
Derived layers should add all internal blobs to the 'col' provided.
override void backward(BlobCollection< T > colTop, List< bool > rgbPropagateDown, BlobCollection< T > colBottom)
Computes the loss error gradient w.r.t. the outputs.
override void forward(BlobCollection< T > colBottom, BlobCollection< T > colTop)
The forward computation.
override bool ReInitializeParameters(WEIGHT_TARGET target)
Re-initialize the parameters of the layer.
override int ExactNumTopBlobs
Returns the exact number of required top (output) Blobs: ip
override void LayerSetUp(BlobCollection< T > colBottom, BlobCollection< T > colTop)
Setup the layer.
override void Reshape(BlobCollection< T > colBottom, BlobCollection< T > colTop)
Reshape the bottom (input) and top (output) blobs.
override void dispose()
Releases all GPU and host resources used by the Layer.
override int ExactNumBottomBlobs
Returns the exact number of required bottom (input) Blobs: input, state (last ct),...
The EltwiseLayer computes elementwise operations, such as product and sum, along multiple input blobs...
The InnerProductLayer, also known as a 'fully-connected' layer, computes the inner product with a set ...
An interface for the units of computation which can be composed into a Net.
Log m_log
Specifies the Log for output.
LayerParameter m_param
Specifies the LayerParameter describing the Layer.
void Backward(BlobCollection< T > colTop, List< bool > rgbPropagateDown, BlobCollection< T > colBottom)
Given the top Blob error gradients, compute the bottom Blob error gradients.
virtual bool ReInitializeParameters(WEIGHT_TARGET target)
Re-initialize the parameters of the layer.
double Forward(BlobCollection< T > colBottom, BlobCollection< T > colTop)
Given the bottom (input) Blobs, this function computes the top (output) Blobs and the loss.
float convertF(T df)
Converts a generic to a float value.
abstract void Reshape(BlobCollection< T > colBottom, BlobCollection< T > colTop)
Adjust the shapes of top blobs and internal buffers to accommodate the shapes of the bottom blobs.
virtual bool reshapeNeeded(BlobCollection< T > colBottom, BlobCollection< T > colTop, bool bReset=true)
Tests the shapes of both the bottom and top blobs and if they are the same as the previous sizing,...
CudaDnn< T > m_cuda
Specifies the CudaDnn connection to Cuda.
void Setup(BlobCollection< T > colBottom, BlobCollection< T > colTop)
Implements common Layer setup functionality.
LayerParameter.LayerType m_type
Specifies the Layer type.
BlobCollection< T > blobs
Returns the collection of learnable parameter Blobs for the Layer.
BlobCollection< T > m_colBlobs
Specifies the learnable parameter Blobs of the Layer.
DictionaryMap< bool > m_rgbParamPropagateDown
Specifies whether or not to compute the learnable diff of each parameter Blob.
The LayerParameterEx class is used when sharing another Net to conserve GPU memory and extends the La...
BlobCollection< T > SharedBlobs
Returns the shared parameter Blobs.
Layer< T > SharedLayer
Returns the layer in the shared Net that matches this one.
BlobCollection< T > SharedLayerBlobs
Returns the shared Layer Blobs.
The TanhLayer is a neuron layer that calculates the tanh function, popular with auto-encoders....
The TransposeLayer performs a permute and transpose operation similar to numpy.transpose.
FillerParameter bias_filler
The filler for the bias.
FillerParameter weight_filler
The filler for the weights.
uint dim
Specifies the dim of the attention unit which should match the LSTM output size.
Specifies the parameters for the EltwiseLayer.
EltwiseOp
Defines the operation to perform.
EltwiseOp operation
Specifies the element-wise operation.
Specifies whether to use the NVIDIA cuDnn version or Caffe version of a given forward/backward operat...
Engine engine
Specifies the Engine in use.
Engine
Defines the type of engine to use.
FillerParameter weight_filler
The filler for the weights.
int axis
Specifies the first axis to be lumped into a single inner product computation; all preceding axes are...
FillerParameter bias_filler
The filler for the bias.
uint num_output
The number of outputs for the layer.
bool bias_term
Whether to have bias terms or not.
Specifies the base parameter for all layers.
string name
Specifies the name of this LayerParameter.
EltwiseParameter eltwise_param
Returns the parameter set when initialized with LayerType.ELTWISE
InnerProductParameter inner_product_param
Returns the parameter set when initialized with LayerType.INNERPRODUCT
TransposeParameter transpose_param
Returns the parameter set when initialized with LayerType.TRANSPOSE
AttentionParameter attention_param
Returns the parameter set when initialized with LayerType.ATTENTION
LayerType
Specifies the layer type.
TanhParameter tanh_param
Returns the parameter set when initialized with LayerType.TANH
The MyCaffe.basecode contains all generic types used throughout MyCaffe.
The MyCaffe.common namespace contains common MyCaffe classes.
WEIGHT_TARGET
Defines the type of weight to target in re-initializations.
The MyCaffe.fillers namespace contains all fillers including the Filler class.
The MyCaffe.layers.beta namespace contains all beta stage layers.
The MyCaffe.layers namespace contains all layers that have a solidified code base,...
The MyCaffe.param namespace contains parameters used to create models.
The MyCaffe namespace contains the main body of MyCaffe code that closely tracks the C++ Caffe open-...