// Source fragments from the CfcLayer<T> implementation in MyCaffe.layers.lnn (some lines elided).
using System.Collections.Generic;
using System.Runtime.InteropServices;
// Member fields.
int m_nTrueInFeatures;
int m_nReshapeCount = 0;
List<BlobCollection<T>> m_rgrgInternalBlobs = new List<BlobCollection<T>>();
Blob<T> m_blobForwardInput = null;
Blob<T> m_blobForwardInput1 = null;
Blob<T> m_blobForwardInput2 = null;
Blob<T> m_blobForwardOutput = null;
Blob<T> m_blobForwardOutput1 = null;
Blob<T> m_blobForwardOutput2 = null;
Blob<T> m_blobTimeSinceUpdate = null;
Blob<T> m_blobTimeSinceUpdate1 = null;
Blob<T> m_blobCurrentMask = null;
Blob<T> m_blobCurrentMaskFull = null;
Blob<T> m_blobCurrentOutput = null;
Blob<T> m_blobOutputSequence = null;
int[] m_rgShape = new int[] { 1, 1, 1, 1 };
bool m_bSetup = false;
int m_nHiddenSize = 0;
// From the dispose helper that walks the nested list of internal blob collections (bodies elided).
for (int i = 0; i < rg.Count; i++)
    for (int j = 0; j < rg[i].Count; j++)
        if (rg[i][j] != null)
            ...
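The loop above is the body of a helper that releases every blob held in the nested internal collections. A minimal sketch of what that helper plausibly looks like follows; the exact signature and the use of Clear() are assumptions rather than the verbatim source.

// Hypothetical reconstruction of the nested-list dispose helper.
protected void dispose(ref List<BlobCollection<T>> rg)
{
    if (rg == null)
        return;

    for (int i = 0; i < rg.Count; i++)
    {
        for (int j = 0; j < rg[i].Count; j++)
        {
            if (rg[i][j] != null)
                rg[i][j].Dispose();   // free the GPU and host resources held by each blob
        }

        rg[i].Clear();                // remove all items from the collection
    }

    rg.Clear();
    rg = null;
}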
// From dispose(): release the internal blob collections and working blobs.
dispose(ref m_rgrgInternalBlobs);
dispose(ref m_blobForwardInput);
dispose(ref m_blobForwardInput1);
dispose(ref m_blobForwardInput2);
dispose(ref m_blobForwardOutput);
dispose(ref m_blobForwardOutput1);
dispose(ref m_blobForwardOutput2);
dispose(ref m_blobTimeSinceUpdate);
dispose(ref m_blobTimeSinceUpdate1);
dispose(ref m_blobCurrentMask);
dispose(ref m_blobCurrentMaskFull);
dispose(ref m_blobCurrentOutput);
dispose(ref m_blobOutputSequence);
// From ReInitializeParameters():
base.ReInitializeParameters(target);
// From LayerSetUp() (non-contiguous fragment): size the internal blobs and set up the
// concat, recurrent-cell and inner-product (fc) sub-layers.
m_nBatchSize = colBottom[0].num;
m_nSeqLen = colBottom[0].channels;
m_nTrueInFeatures = colBottom[0].count(2);

m_rgShape[0] = m_nBatchSize;
m_rgShape[1] = m_nHiddenSize;
m_blobHState1.Reshape(m_rgShape);
m_blobHState.Reshape(m_rgShape);

// One hidden-state blob and one internal blob collection per timestep.
for (int i = 0; i < m_nSeqLen; i++)
{
    ...
    blobHStateT.Name = "h_state_" + i.ToString();
    m_rgBlobHState.Add(blobHStateT);
    ...
    m_rgrgInternalBlobs.Add(col);
}

m_blobTs.Reshape(m_rgShape);

m_rgShape[1] = m_nTrueInFeatures;
m_blobInputs.Reshape(m_rgShape);

m_nMaskCount = m_blobMask.count(2);
m_blobCurrentMask.Reshape(m_rgShape);

m_rgShape[1] = m_nTrueInFeatures;
m_blobForwardInput.Reshape(m_rgShape);
m_blobForwardInput1.Reshape(m_rgShape);
m_blobForwardInput2.Reshape(m_rgShape);
m_blobTimeSinceUpdate.Reshape(m_rgShape);
m_blobTimeSinceUpdate1.Reshape(m_rgShape);
m_blobTsFull.Reshape(m_rgShape);

m_blobForwardOutput.Reshape(m_rgShape);
m_blobForwardOutput1.Reshape(m_rgShape);
m_blobForwardOutput2.Reshape(m_rgShape);

// m_cat (concat): joins the forward input, time-since-update and mask into the cell input.
addBtmTop(m_blobForwardInput, m_blobInputs1);
m_colBtm.Add(m_blobTimeSinceUpdate);
m_colBtm.Add(m_blobMask);
m_cat.Setup(m_colBtm, m_colTop);

// m_rnn_cell (Cfc or Ltc unit): shares the per-timestep internal blobs.
((LnnUnitLayer<T>)m_rnn_cell).SetInternalSharedBlobs(m_rgrgInternalBlobs[0]);

addBtmTop(m_blobInputs1, m_blobHState);
m_colBtm.Add(m_blobHState1);
m_colBtm.Add(m_blobTs);
m_rnn_cell.Setup(m_colBtm, m_colTop);

// m_fc (inner product): maps the hidden state to the output features.
addBtmTop(m_blobHState, m_blobCurrentOutput);
m_fc.Setup(m_colBtm, m_colTop);

m_blobCurrentMaskFull.ReshapeLike(m_blobCurrentOutput);

addBtmTop(m_blobHState, colTop[0]);
m_fc.Reshape(m_colBtm, m_colTop);
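The addBtmTop helper used before each sub-layer call above is not part of this fragment. A plausible sketch follows, assuming m_colBtm and m_colTop are reusable BlobCollection<T> members of the layer.

// Hypothetical reconstruction: reset the working bottom/top collections and seed them with one
// bottom and one top blob; callers then Add() any extra bottoms before invoking a sub-layer's
// Setup, Reshape, Forward or Backward.
private void addBtmTop(Blob<T> btm, Blob<T> top)
{
    m_colBtm.Clear();
    m_colBtm.Add(btm);
    m_colTop.Clear();
    m_colTop.Add(top);
}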
// From Reshape() (non-contiguous fragment): re-size the internal blobs and sub-layers.
int nTrueInFeatures = (int)colBottom[0].count(2);

// Guard that detects when nothing has changed since the last reshape (body elided).
if (m_nReshapeCount > 0 &&
    m_nBatchSize > 0 && m_nBatchSize == colBottom[0].num &&
    m_nSeqLen > 0 && m_nSeqLen == colBottom[0].channels &&
    m_nTrueInFeatures > 0 && m_nTrueInFeatures == nTrueInFeatures)
{
    ...
}

m_nBatchSize = colBottom[0].num;
m_nSeqLen = colBottom[0].channels;
m_nTrueInFeatures = nTrueInFeatures;

m_rgShape[0] = m_nBatchSize;
m_rgShape[1] = m_nHiddenSize;

m_blobHState1.Reshape(m_rgShape);
m_blobHState.Reshape(m_rgShape);

for (int i = 0; i < m_nSeqLen; i++)
    m_rgBlobHState[i].Reshape(m_rgShape);

m_blobTs.Reshape(m_rgShape);

m_rgShape[1] = m_nTrueInFeatures;
m_blobInputs.Reshape(m_rgShape);

m_nMaskCount = m_blobMask.count(2);
m_blobCurrentMask.Reshape(m_rgShape);

m_rgShape[1] = m_nTrueInFeatures;
m_blobForwardInput.Reshape(m_rgShape);
m_blobForwardInput1.Reshape(m_rgShape);
m_blobForwardInput2.Reshape(m_rgShape);
m_blobTimeSinceUpdate.Reshape(m_rgShape);
m_blobTimeSinceUpdate1.Reshape(m_rgShape);

m_blobForwardOutput.Reshape(m_rgShape);
m_blobForwardOutput1.Reshape(m_rgShape);
m_blobForwardOutput2.Reshape(m_rgShape);

addBtmTop(m_blobForwardInput, m_blobInputs1);
m_colBtm.Add(m_blobTimeSinceUpdate);
m_colBtm.Add(m_blobMask);
m_cat.Reshape(m_colBtm, m_colTop);

// Reshape the recurrent cell once per timestep so each step's shared internal blobs are sized.
for (int i = 0; i < m_nSeqLen; i++)
{
    addBtmTop(m_blobInputs1, m_blobHState);
    m_colBtm.Add(m_blobHState1);
    m_colBtm.Add(m_blobTs);

    ((LnnUnitLayer<T>)m_rnn_cell).SetInternalSharedBlobs(m_rgrgInternalBlobs[i]);
    m_rnn_cell.Reshape(m_colBtm, m_colTop);
}

addBtmTop(m_blobHState, m_blobCurrentOutput);
m_fc.Reshape(m_colBtm, m_colTop);

m_blobCurrentMaskFull.ReshapeLike(m_blobCurrentOutput);

addBtmTop(m_blobHState, colTop[0]);
m_fc.Reshape(m_colBtm, m_colTop);
// From forward() (non-contiguous fragment): run the recurrence one timestep at a time.
m_blobForwardOutput.SetData(0);
m_blobTimeSinceUpdate.SetData(0);

for (int t = 0; t < m_nSeqLen; t++)
{
    // Copy timestep 't' of the timestamp bottom into m_blobTs.
    m_cuda.channel_copy(m_blobTs.count(), m_blobTs.num, 1, m_nSeqLen, 1, t, colBottom[1].gpu_data, m_blobTs.mutable_gpu_data, DIR.FWD);

    // With a mask bottom, build the cell input by concatenating the forward input,
    // time-since-update and mask; otherwise use the raw inputs directly.
    if (colBottom.Count > 2)
    {
        int nMaskCount = colBottom[2].count(2);
        if (nMaskCount == m_nTrueInFeatures)
        {
            ...
            addBtmTop(m_blobForwardInput, m_blobInputs1);
            m_colBtm.Add(m_blobTimeSinceUpdate);
            m_colBtm.Add(m_blobMask);
            m_cat.Forward(m_colBtm, m_colTop);
        }
        else
        {
            ...
            addBtmTop(m_blobForwardInput, m_blobInputs1);
            m_colBtm.Add(m_blobMask);
            m_cat.Forward(m_colBtm, m_colTop);
        }
    }
    else
    {
        m_blobInputs1.CopyFrom(m_blobInputs);
    }

    // Run the recurrent cell for this timestep using its per-timestep shared blobs.
    addBtmTop(m_blobInputs1, m_blobHState1);
    m_colBtm.Add(m_blobHState);
    m_colBtm.Add(m_blobTs);

    ((LnnUnitLayer<T>)m_rnn_cell).SetInternalSharedBlobs(m_rgrgInternalBlobs[t]);
    m_rnn_cell.Forward(m_colBtm, m_colTop);

    // Save the hidden state for this timestep; it is reused on the backward pass.
    m_rgBlobHState[t].CopyFrom(m_blobHState1);

    if (colBottom.Count > 2)
    {
        ...
        m_blobCurrentMask.SetDiff(1.0);
        ...
        addBtmTop(m_blobHState1, m_blobCurrentOutput);
        m_fc.Forward(m_colBtm, m_colTop);
        ...
    }

    m_blobHState.CopyFrom(m_blobHState1);
}

// Produce the top output; the condition guarding the unimplemented return-sequences path is elided here.
if (...)
    throw new NotImplementedException("return sequences is not implemented yet.");
else if (colBottom.Count > 2)
{
    colTop[0].CopyFrom(m_blobForwardOutput);
}
else
{
    addBtmTop(m_blobHState, colTop[0]);
    m_fc.Forward(m_colBtm, m_colTop);
}
// From backward() (non-contiguous fragment): push the top diff back through the fc head,
// then through the recurrent cell and the concat, one timestep at a time in reverse.
if (...)   // return-sequences path (condition elided)
    throw new NotImplementedException("return sequences is not implemented yet.");
else if (colBottom.Count > 2)
{
    m_blobForwardOutput.CopyFrom(colTop[0], true);   // copy the top diff
}
else
{
    addBtmTop(m_blobHState, colTop[0]);
    m_fc.Backward(m_colTop, rgbPropagateDown, m_colBtm);
}

int nMaskCount = colBottom[2].count(2);

for (int t = m_nSeqLen - 1; t >= 0; t--)
{
    // Restore the hidden state saved for this timestep on the forward pass.
    m_blobHState1.CopyFrom(m_rgBlobHState[t]);

    if (colBottom.Count > 2)
    {
        ...
        m_blobCurrentMask.SetDiff(1.0);
        ...
        m_blobForwardOutput1.CopyFrom(m_blobForwardOutput, true);
        m_blobForwardOutput2.CopyFrom(m_blobForwardOutput, true);
        ...
        addBtmTop(m_blobHState1, m_blobCurrentOutput);
        m_fc.Backward(m_colTop, rgbPropagateDown, m_colBtm);
        ...
    }

    if (t < m_nSeqLen - 1)
    {
        ...
    }

    // Backward through the recurrent cell for timestep 't'.
    addBtmTop(m_blobInputs1, m_blobHState1);
    m_colBtm.Add(m_blobHState);
    m_colBtm.Add(m_blobTs);

    ((LnnUnitLayer<T>)m_rnn_cell).SetInternalSharedBlobs(m_rgrgInternalBlobs[t]);
    m_rnn_cell.Backward(m_colTop, new List<bool>() { true, true, true }, m_colBtm);
    m_rgBlobHState[t].CopyFrom(m_blobHState, true);

    // Backward through the concat, splitting the diff back into input, time-since-update and mask.
    if (colBottom.Count > 2)
    {
        ...
        addBtmTop(m_blobForwardInput1, m_blobInputs1);
        m_colBtm.Add(m_blobTimeSinceUpdate);
        m_colBtm.Add(m_blobMask);
        m_cat.Backward(m_colTop, new List<bool>() { true, true, true }, m_colBtm);
        ...
        addBtmTop(m_blobForwardInput1, m_blobInputs1);
        m_colBtm.Add(m_blobMask);
        m_cat.Backward(m_colTop, new List<bool>() { true, true }, m_colBtm);
        ...
        if (nMaskCount == m_nTrueInFeatures)
        {
            ...
        }
    }
    ...
    m_blobInputs.CopyFrom(m_blobInputs1, true);
}
Reference documentation for the symbols used in the fragments above follows. The Log class provides general output in text form.
The BlobCollection contains a list of Blobs.
void Add(Blob< T > b)
Add a new Blob to the collection.
int Count
Returns the number of items in the collection.
void Clear(bool bDispose=false)
Remove all items from the collection.
void Reshape(int[] rgShape)
Reshapes all blobs in the collection to the given shape.
void CopyFrom(BlobCollection< T > bSrc, bool bCopyDiff=false)
Copy the data or diff from another BlobCollection into this one.
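A brief usage sketch of the BlobCollection<T> members listed above; the cuda and log variables and the Blob<double> constructor arguments are assumptions made for illustration.

// Hypothetical BlobCollection<T> usage (names are illustrative only).
BlobCollection<double> col = new BlobCollection<double>();
col.Add(new Blob<double>(cuda, log));        // Add a new Blob to the collection.
col.Add(new Blob<double>(cuda, log));
col.Reshape(new int[] { 32, 10, 1, 1 });     // Reshape every blob in the collection.

int nCount = col.Count;                      // Number of items held (2).

BlobCollection<double> colCopy = new BlobCollection<double>();
colCopy.Add(new Blob<double>(cuda, log));
colCopy.Add(new Blob<double>(cuda, log));
colCopy.Reshape(new int[] { 32, 10, 1, 1 });
colCopy.CopyFrom(col);                       // Copy the data (bCopyDiff defaults to false).

col.Clear();                                 // Remove all items from the collection.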
The Blob is the main holder of data that moves through the Layers of the Net.
int channels
DEPRECATED; legacy shape accessor channels: use shape(1) instead.
void SetData(T[] rgData, int nCount=-1, bool bSetCount=true)
Sets a number of items within the Blob's data.
long mutable_gpu_diff
Returns the diff GPU handle used by the CudaDnn connection.
long mutable_gpu_data
Returns the data GPU handle used by the CudaDnn connection.
void Unsqueeze(int nNumAxes)
Unsqueeze the shape by adding shape=1 on each axis until the 'nNumAxes' is reached.
void Reshape(int nNum, int nChannels, int nHeight, int nWidth, bool? bUseHalfSize=null)
DEPRECATED; use the Reshape(rgShape) overload instead.
void CopyFrom(Blob< T > src, int nSrcOffset, int nDstOffset, int nCount, bool bCopyData, bool bCopyDiff)
Copy from a source Blob.
int count()
Returns the total number of items in the Blob.
void ReshapeLike(Blob< T > b, bool? bUseHalfSize=null)
Reshape this Blob to have the same shape as another Blob.
string Name
Get/set the name of the Blob.
long gpu_diff
Returns the diff GPU handle used by the CudaDnn connection.
void SetDiff(double dfVal, int nIdx=-1)
Either sets all of the diff items in the Blob to a given value, or alternatively only sets a single i...
int num
DEPRECATED; legacy shape accessor num: use shape(0) instead.
long gpu_data
Returns the data GPU handle used by the CudaDnn connection.
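A short sketch of the Blob<T> members listed above; again, cuda and log are assumed to be existing CudaDnn<double> and Log instances.

// Hypothetical Blob<T> usage (illustrative only).
Blob<double> b = new Blob<double>(cuda, log);
b.Name = "h_state_0";                        // Get/set the blob name.
b.Reshape(new int[] { 32, 256, 1, 1 });      // Shape-array reshape, as used by the layer above.

int nTotal = b.count();                      // Total number of items (32 * 256).
int nNum = b.num;                            // Legacy accessor for shape(0).
int nChannels = b.channels;                  // Legacy accessor for shape(1).

b.SetData(0);                                // Fill the data with a constant.
b.SetDiff(1.0);                              // Fill the diff with a constant.

Blob<double> b2 = new Blob<double>(cuda, log);
b2.ReshapeLike(b);                           // Same shape as 'b'.
b2.CopyFrom(b);                              // Copy the data from 'b'.

long hData = b.gpu_data;                     // GPU handle for the data.
long hDiff = b.mutable_gpu_diff;             // Writable GPU handle for the diff.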
The CudaDnn object is the main interface to the Low-Level Cuda C++ DLL.
An interface for the units of computation which can be composed into a Net.
Log m_log
Specifies the Log for output.
LayerParameter m_param
Specifies the LayerParameter describing the Layer.
void Backward(BlobCollection< T > colTop, List< bool > rgbPropagateDown, BlobCollection< T > colBottom)
Given the top Blob error gradients, compute the bottom Blob error gradients.
double Forward(BlobCollection< T > colBottom, BlobCollection< T > colTop)
Given the bottom (input) Blobs, this function computes the top (output) Blobs and the loss.
abstract void Reshape(BlobCollection< T > colBottom, BlobCollection< T > colTop)
Adjust the shapes of top blobs and internal buffers to accommodate the shapes of the bottom blobs.
CudaDnn< T > m_cuda
Specifies the CudaDnn connection to Cuda.
void Setup(BlobCollection< T > colBottom, BlobCollection< T > colTop)
Implements common Layer setup functionality.
static Layer< T > Create(CudaDnn< T > cuda, Log log, LayerParameter p, CancelEvent evtCancel, IXDatabaseBase db=null, TransferInput trxinput=null)
Create a new Layer based on the LayerParameter.
LayerParameter.LayerType m_type
Specifies the Layer type.
BlobCollection< T > blobs
Returns the collection of learnable parameter Blobs for the Layer.
LayerParameter convertLayerParam(LayerParameter pChild, LayerParameter pParent)
Called to convert a parent LayerParameterEx, used in blob sharing, with a child layer parameter.
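One detail worth an example: Backward takes a list of propagate-down flags, and the CfcLayer code above passes literal lists such as new List<bool>() { true, true, true } to its sub-layers. Each entry lines up with one bottom blob and requests the error gradient for that bottom. A minimal sketch, assuming layer, colTop and colBottom already exist and colBottom holds three blobs:

// Hypothetical: request gradients for the first two bottoms only; the third bottom
// (for example, a mask) does not need its gradient computed.
List<bool> rgbPropagateDown = new List<bool>() { true, true, false };
layer.Backward(colTop, rgbPropagateDown, colBottom);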
The CfcLayer implements the Closed form Continuous layer.
override int ExactNumTopBlobs
Returns the exact number of required top (output) Blobs: attn
CfcLayer(CudaDnn< T > cuda, Log log, LayerParameter p)
The CfcLayer constructor.
override void LayerSetUp(BlobCollection< T > colBottom, BlobCollection< T > colTop)
Setup the layer.
override void forward(BlobCollection< T > colBottom, BlobCollection< T > colTop)
Forward computation
override int ExactNumBottomBlobs
Returns the exact number of required bottom (input) Blobs: input, hx, ts
override void backward(BlobCollection< T > colTop, List< bool > rgbPropagateDown, BlobCollection< T > colBottom)
Computes the error gradient w.r.t. the Cfc value inputs.
override void dispose()
Releases all GPU and host resources used by the Layer.
override bool ReInitializeParameters(WEIGHT_TARGET target)
Re-initialize the parameters of the layer.
override void setup_internal_blobs(BlobCollection< T > col)
Derived layers should add all of their internal blobs to the 'col' provided.
override void Reshape(BlobCollection< T > colBottom, BlobCollection< T > colTop)
Reshape the bottom (input) and top (output) blobs.
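Putting the fragments together, a plausible sketch of creating and running a CfcLayer; the blob names, the CancelEvent argument and the LayerParameter 'p' (configured in the sketch after the parameter descriptions below) are assumptions.

// Hypothetical: create a CfcLayer from a configured LayerParameter 'p' and run it.
Layer<double> cfc = Layer<double>.Create(cuda, log, p, new CancelEvent());

BlobCollection<double> colBottom = new BlobCollection<double>();
colBottom.Add(blobX);           // input:      batch x seq-len x input-features
colBottom.Add(blobTimestamps);  // timestamps: batch x seq-len
colBottom.Add(blobMask);        // optional mask; only used when more than two bottoms are given

BlobCollection<double> colTop = new BlobCollection<double>();
colTop.Add(new Blob<double>(cuda, log));

cfc.Setup(colBottom, colTop);   // LayerSetUp + Reshape (fragments shown above)
cfc.Forward(colBottom, colTop); // per-timestep recurrence followed by the fc output head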
The LnnUnitLayer implements the base class to the Cfc and Ltc Unit layers.
int axis
The axis along which to concatenate – may be negative to index from the end (e.g.,...
The FillerParameter specifies the filler parameters used to create each Filler.
FillerParameter weight_filler
The filler for the weights.
int axis
Specifies the first axis to be lumped into a single inner product computation; all preceding axes are...
FillerParameter bias_filler
The filler for the bias.
uint num_output
The number of outputs for the layer.
bool bias_term
Whether to have bias terms or not.
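For reference, a small sketch of how an inner-product sub-layer such as the fc output head might be parameterized with the fields above; the FillerParameter constructor arguments and the filler types are assumptions.

// Hypothetical inner-product configuration (values are illustrative only).
LayerParameter fc = new LayerParameter(LayerParameter.LayerType.INNERPRODUCT);
fc.inner_product_param.num_output = 2;                                 // number of outputs
fc.inner_product_param.bias_term = true;                               // include a bias term
fc.inner_product_param.axis = 1;                                       // lump axes 1..end into one product
fc.inner_product_param.weight_filler = new FillerParameter("xavier");  // assumed ctor
fc.inner_product_param.bias_filler = new FillerParameter("constant");  // assumed ctor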
The LayerParameter specifies the base parameter for all layers.
CfcParameter cfc_param
Returns the parameter set when initialized with LayerType.CFC
LtcUnitParameter ltc_unit_param
Returns the parameter set when initialized with LayerType.LTC_UNIT
InnerProductParameter inner_product_param
Returns the parameter set when initialized with LayerType.INNERPRODUCT
ConcatParameter concat_param
Returns the parameter set when initialized with LayerType.CONCAT
CfcUnitParameter cfc_unit_param
Returns the parameter set when initialized with LayerType.CFC_UNIT
LayerType
Specifies the layer type.
The CfcParameter specifies the parameters used by the CfcLayer. Note, you must also fill out the CfcUnitParameter.
CELL_TYPE cell_type
Specifies the cell type to use (default = CFC).
CELL_TYPE
Defines the cell type.
int input_features
Specifies the number of input features.
int output_features
Specifies the number of output features.
bool return_sequences
Specifies whether or not to return the sequence.
int hidden_size
Specifies the hidden size used to size the backbone units and other internal layers.
override void Copy(LayerParameterBase src)
Copy one parameter to another.
int hidden_size
Specifies the number of hidden units (default = 256).
override void Copy(LayerParameterBase src)
Copy one parameter to another.
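Finally, a sketch of filling out the CfcParameter and CfcUnitParameter described above; the enum nesting (CfcParameter.CELL_TYPE) and the concrete values are assumptions.

// Hypothetical parameter configuration for the CfcLayer.
LayerParameter p = new LayerParameter(LayerParameter.LayerType.CFC);
p.cfc_param.cell_type = CfcParameter.CELL_TYPE.CFC;  // default = CFC
p.cfc_param.input_features = 82;
p.cfc_param.hidden_size = 256;                       // sizes the backbone and internal layers
p.cfc_param.output_features = 2;
p.cfc_param.return_sequences = false;                // 'true' throws NotImplementedException (see forward above)
p.cfc_unit_param.hidden_size = 256;                  // the CfcUnitParameter must also be filled out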
The MyCaffe.basecode contains all generic types used throughout MyCaffe.
The MyCaffe.common namespace contains common MyCaffe classes.
DIR
Defines the direction of data flow.
WEIGHT_TARGET
Defines the type of weight to target in re-initializations.
The MyCaffe.layers.lnn namespace contains all Liquid Neural Network (LNN) related layers.
The MyCaffe.param namespace contains parameters used to create models.
The MyCaffe namespace contains the main body of MyCaffe code that closely tracks the C++ Caffe open-source project.