using System.Collections.Generic;

List<double> m_rgdfCoeffs = new List<double>();
Blob<T> m_blobSingleSecondary = null;
bool m_bStableProdGrad;

m_blobIdx = new Blob<T>(cuda, log);

if (m_blobSingleSecondary != null)
    m_blobSingleSecondary.Dispose();

m_log.CHECK(nCoeffSize == 0 || (!m_bCoeffBlob && nCoeffSize == colBottom.Count) || (m_bCoeffBlob && nCoeffSize == colBottom.Count - 1), "Eltwise Layer takes one coefficient per bottom blob.");
int nCoeffBlobCount = (m_bCoeffBlob) ? 1 : 0;
m_log.CHECK_EQ(colBottom.Count, 2, "Only two inputs allowed when 'allow_single_batch_input' = true.");

if (colBottom[1].count() == 1)
    m_log.CHECK_EQ(colBottom.Count, 2, "Only two inputs allowed when colBottom[1].count() == 1.");

for (int i = 1; i < colBottom.Count; i++)
    if (m_bCoeffBlob && i == colBottom.Count - 1)
        m_log.CHECK_EQ(i, colBottom[i].shape(0), "Dimensions of coeff blob axis 0 must equal the number of bottom blobs (not including the coeff blob itself).");
        for (int input_axis = 0, coeff_axis = 1; coeff_axis < colBottom[i].num_axes; input_axis++, coeff_axis++)
            m_log.CHECK_EQ(colBottom[0].shape(input_axis), colBottom[i].shape(coeff_axis), "Each axis i >= 1 of the coeff blob must match the (i-1)th axis of the input.");
if (colBottom.Count == 2 && colBottom[1].count() == 1)
    if (m_blobSingleSecondary == null)

double dfVal = Utility.ConvertVal<T>(colBottom[i].GetData(0));
m_blobSingleSecondary.SetData(dfVal);
m_log.CHECK(Utility.Compare<int>(colBottom[i].shape(), colBottom[0].shape(), false), "The bottoms should all be of the same shape.");

if (m_blobSingleSecondary == null)

m_log.CHECK_EQ(colBottom[i].num, 1, "The batch for the second input must be 1.");
m_log.CHECK_EQ(colBottom[i].count(1), colBottom[0].count(1), "All shapes other than the first shape must match!");

m_blobIdx.Reshape(colBottom[0].shape());
Blob<T> blob = (m_blobSingleSecondary != null) ? m_blobSingleSecondary : colBottom[1];

int nCount = colTop[0].count();
long hTopData = colTop[0].mutable_gpu_data;
m_cuda.mul(nCount, colBottom[0].gpu_data, blob.gpu_data, hTopData);
for (int i = 2; i < colBottom.Count; i++)
    m_cuda.mul(nCount, hTopData, colBottom[i].gpu_data, hTopData);

m_cuda.div(nCount, colBottom[0].gpu_data, blob.gpu_data, hTopData);
for (int i = 2; i < colBottom.Count; i++)
    m_cuda.div(nCount, hTopData, colBottom[i].gpu_data, hTopData);
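The PROD and DIV paths fold each additional bottom into a running elementwise product (or quotient). A minimal CPU sketch of the same math (illustrative only; the layer itself runs these steps through the CudaDnn kernels above):

// Hypothetical CPU reference for the PROD forward path, not part of the MyCaffe API.
static double[] EltwiseProd(IList<double[]> rgBottoms)
{
    double[] rgTop = (double[])rgBottoms[0].Clone();
    for (int i = 1; i < rgBottoms.Count; i++)       // fold each remaining input in
        for (int j = 0; j < rgTop.Length; j++)
            rgTop[j] *= rgBottoms[i][j];            // use /= here for the DIV path
    return rgTop;
}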
int nNum = colTop[0].num;
int nDim = nCount / nNum;
hCoeffData = colBottom[colBottom.Count - 1].gpu_data;

for (int i = 0; i < colBottom.Count - nCoeffCount; i++)
{
    long hBottomData = (i == 0 || colBottom.Count > 3) ? colBottom[i].gpu_data : blob.gpu_data;
    m_cuda.coeff_sum_fwd(nCount, nDim, i * nNum, m_rgdfCoeffs[i], hCoeffData, hBottomData, hTopData);
}
m_cuda.set(nCount, hTopData, 0);

for (int i = 0; i < colBottom.Count; i++)
{
    long hBottomData = (i == 0 || colBottom.Count > 2) ? colBottom[i].gpu_data : blob.gpu_data;
    m_cuda.axpy(nCount, m_rgdfCoeffs[i], hBottomData, hTopData);
}
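Either way, the SUM forward computes top = coeff[0]*bottom[0] + coeff[1]*bottom[1] + ..., accumulated with axpy into a zeroed top. A CPU sketch of that accumulation (illustrative only, not the MyCaffe API):

static double[] EltwiseSum(IList<double[]> rgBottoms, IList<double> rgCoeffs)
{
    double[] rgTop = new double[rgBottoms[0].Length];  // zeroed, like m_cuda.set above
    for (int i = 0; i < rgBottoms.Count; i++)
        for (int j = 0; j < rgTop.Length; j++)
            rgTop[j] += rgCoeffs[i] * rgBottoms[i][j]; // the axpy step
    return rgTop;
}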
int nNum = colTop[0].num;
int nDim = nCount / nNum;
hCoeffData = colBottom[colBottom.Count - 1].gpu_data;

for (int i = 0; i < colBottom.Count - nCoeffCount; i++)
{
    long hBottomData = (i == 0 || colBottom.Count > 3) ? colBottom[i].gpu_data : blob.gpu_data;
    m_cuda.coeff_sub_fwd(nCount, nDim, i * nNum, m_rgdfCoeffs[i], hCoeffData, hBottomData, hTopData);
}
m_cuda.scale(nCount, m_rgdfCoeffs[0], colBottom[0].gpu_data, hTopData);

for (int i = 1; i < colBottom.Count; i++)
{
    long hBottomData = (i == 0 || colBottom.Count > 2) ? colBottom[i].gpu_data : blob.gpu_data;
    m_cuda.axpy(nCount, -1 * m_rgdfCoeffs[i], hBottomData, hTopData);
}
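The SUB path differs from SUM only in sign: top = coeff[0]*bottom[0] - coeff[1]*bottom[1] - ... - coeff[n-1]*bottom[n-1], which is why the loop above starts at i = 1 and calls axpy with -1 * m_rgdfCoeffs[i].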
m_cuda.max_fwd(nCount, colBottom[0].gpu_data, colBottom[1].gpu_data, 0, hTopData, hMask);
for (int i = 2; i < colBottom.Count; i++)
    m_cuda.max_fwd(nCount, hTopData, colBottom[i].gpu_data, i - 1, hTopData, hMask);

m_cuda.min_fwd(nCount, colBottom[0].gpu_data, colBottom[1].gpu_data, 0, hTopData, hMask);
for (int i = 2; i < colBottom.Count; i++)
    m_cuda.min_fwd(nCount, hTopData, colBottom[i].gpu_data, i - 1, hTopData, hMask);

m_log.FAIL("Unknown elementwise operation.");
int nCount = colTop[0].count();
long hTopData = colTop[0].gpu_data;
long hTopDiff = colTop[0].gpu_diff;

int nNum = colTop[0].num;
int nDim = nCount / nNum;
hCoeffData = colBottom[colBottom.Count - 1].gpu_data;

for (int i = 0; i < colBottom.Count; i++)
    if (rgbPropagateDown[i])
        long hBottomData = colBottom[i].gpu_data;
        long hBottomDiff = colBottom[i].mutable_gpu_diff;

        if (i == 1 && m_blobSingleSecondary != null)
            hBottomData = m_blobSingleSecondary.gpu_data;
if (m_bStableProdGrad)
    bool bInitialized = false;
    for (int j = 0; j < colBottom.Count; j++)
        m_cuda.copy(nCount, colBottom[j].gpu_data, hBottomDiff);
        m_cuda.mul(nCount, colBottom[j].gpu_data, hBottomDiff, hBottomDiff);

m_cuda.div(nCount, hTopData, hBottomData, hBottomDiff);
m_cuda.mul(nCount, hBottomDiff, hTopDiff, hBottomDiff);

m_cuda.mul(nCount, hTopData, hBottomData, hBottomDiff);
m_cuda.mul(nCount, hBottomDiff, hTopDiff, hBottomDiff);
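Both PROD gradient strategies compute dBottom[i] = dTop * prod(bottom[j] for j != i). The fast path divides the cached top by bottom[i], which is cheap but ill-conditioned when bottom[i] holds zeros or tiny values; the stable path re-multiplies the other inputs instead. A CPU sketch of the stable variant (illustrative only, not the MyCaffe API):

static double[] ProdGradStable(IList<double[]> rgBottoms, double[] rgTopDiff, int nSkip)
{
    int nCount = rgTopDiff.Length;
    double[] rgDiff = new double[nCount];
    bool bInitialized = false;
    for (int j = 0; j < rgBottoms.Count; j++)
    {
        if (j == nSkip)
            continue;                                // product over all inputs but nSkip
        for (int k = 0; k < nCount; k++)
            rgDiff[k] = bInitialized ? rgDiff[k] * rgBottoms[j][k] : rgBottoms[j][k];
        bInitialized = true;                         // first pass copies, later passes multiply
    }
    for (int k = 0; k < nCount; k++)
        rgDiff[k] *= rgTopDiff[k];                   // chain rule: multiply by dTop
    return rgDiff;
}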
m_cuda.coeff_sum_bwd(nCount, nDim, i * nNum, m_rgdfCoeffs[i], hCoeffData, hTopDiff, hBottomDiff);

if (m_rgdfCoeffs[i] == 1.0)
    m_cuda.copy(nCount, hTopDiff, hBottomDiff);
else
    m_cuda.scale(nCount, m_rgdfCoeffs[i], hTopDiff, hBottomDiff);

m_cuda.coeff_sub_bwd(nCount, nDim, i * nNum, m_rgdfCoeffs[i], hCoeffData, hTopDiff, hBottomDiff);

double dfScale = (i == 0) ? 1 : -1;
m_cuda.scale(nCount, dfScale * m_rgdfCoeffs[i], hTopDiff, hBottomDiff);
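For SUM the chain rule gives dBottom[i] = coeff[i] * dTop, so the backward pass is a plain copy when the coefficient is 1 and a scale otherwise; for SUB the same holds with the sign flipped (dfScale = -1) for every input after the first.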
m_cuda.max_bwd(nCount, hTopDiff, i, hMask, hBottomDiff);

m_cuda.min_bwd(nCount, hTopDiff, i, hMask, hBottomDiff);

m_log.FAIL("Unknown elementwise operation.");

m_cuda.channel_sum(nCount, 1, nNum, colTop[0].channels * colTop[0].count(2), m_blobSingleSecondary.gpu_diff, colBottom[1].mutable_gpu_diff);
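When the second input held a single batch item that was broadcast across the batch on the forward pass, its gradient is the sum of the per-item gradients, which channel_sum computes on the GPU. A CPU sketch of that reduction (illustrative only):

static double[] ReduceBatchGrad(double[] rgDiff, int nNum, int nDim)
{
    double[] rgOut = new double[nDim];        // gradient for the single broadcast item
    for (int n = 0; n < nNum; n++)
        for (int d = 0; d < nDim; d++)
            rgOut[d] += rgDiff[n * nDim + d]; // sum over the batch axis
    return rgOut;
}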
The Log class provides general output in text form.
void CHECK(bool b, string str)
Test a flag for true.
void FAIL(string str)
Causes a failure which throws an exception with the descriptive text.
void CHECK_EQ(double df1, double df2, string str)
Test whether one number is equal to another.
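A minimal usage sketch of these Log methods (hypothetical condition and values, using only the signatures listed above):

m_log.CHECK(colBottom.Count >= 2, "At least two bottom blobs are required.");
m_log.CHECK_EQ(colBottom[0].count(), colBottom[1].count(), "The bottom counts must match.");
if (bUnknownOp)  // hypothetical flag
    m_log.FAIL("Unknown elementwise operation.");  // throws with the descriptive text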
The Utility class provides general utility functions.
static List< int > Create(int nCount, int nStart, int nInc)
Create a new List and fill it with values starting with start and incrementing by inc.
The BlobCollection contains a list of Blobs.
void Add(Blob< T > b)
Add a new Blob to the collection.
int Count
Returns the number of items in the collection.
void ReshapeLike(BlobCollection< T > src)
Reshapes all blobs in the collection to the sizes of the source.
The Blob is the main holder of data that moves through the Layers of the Net.
int channels
DEPRECATED; legacy shape accessor channels: use shape(1) instead.
void SetData(T[] rgData, int nCount=-1, bool bSetCount=true)
Sets a number of items within the Blob's data.
long mutable_gpu_diff
Returns the diff GPU handle used by the CudaDnn connection.
long mutable_gpu_data
Returns the data GPU handle used by the CudaDnn connection.
void Reshape(int nNum, int nChannels, int nHeight, int nWidth, bool? bUseHalfSize=null)
DEPRECATED; use
int count()
Returns the total number of items in the Blob.
void ReshapeLike(Blob< T > b, bool? bUseHalfSize=null)
Reshape this Blob to have the same shape as another Blob.
string Name
Get/set the name of the Blob.
long gpu_diff
Returns the diff GPU handle used by the CudaDnn connection.
virtual void Dispose(bool bDisposing)
Releases all resources used by the Blob (including both GPU and Host).
int num
DEPRECATED; legacy shape accessor num: use shape(0) instead.
long gpu_data
Returns the data GPU handle used by the CudaDnn connection.
The CudaDnn object is the main interface to the Low-Level Cuda C++ DLL.
The EltwiseLayer computes elementwise operations, such as product and sum, along multiple input blobs...
override void LayerSetUp(BlobCollection< T > colBottom, BlobCollection< T > colTop)
Setup the layer.
EltwiseLayer(CudaDnn< T > cuda, Log log, LayerParameter p)
The EltwiseLayer constructor.
override void forward(BlobCollection< T > colBottom, BlobCollection< T > colTop)
The Forward computation.
override int ExactNumTopBlobs
Returns the exact number of required top (output) Blobs: output (result of eltwise operation in input...
override int MinBottomBlobs
Returns the minimum required number of bottom (input) Blobs: input1, input2
override void dispose()
Releases all GPU and host resources used by the Layer.
override void backward(BlobCollection< T > colTop, List< bool > rgbPropagateDown, BlobCollection< T > colBottom)
Computes the error gradient w.r.t. the input.
override void Reshape(BlobCollection< T > colBottom, BlobCollection< T > colTop)
Reshape the bottom (input) and top (output) blobs.
override void setup_internal_blobs(BlobCollection< T > col)
Derived layers should add all internal blobs to the 'col' provided.
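Putting the listed members together, a minimal construction sketch (assumed setup: cuda, log, colBottom and colTop are presumed to already exist, and the LayerParameter constructor taking a LayerType is an assumption):

LayerParameter p = new LayerParameter(LayerParameter.LayerType.ELTWISE);
p.eltwise_param.operation = EltwiseParameter.EltwiseOp.SUM;  // assumed enum value
p.eltwise_param.coeff = new List<double>() { 1.0, -1.0 };    // top = bottom0 - bottom1
EltwiseLayer<float> layer = new EltwiseLayer<float>(cuda, log, p);
// LayerSetUp, Reshape, forward and backward are then driven by the Net
// (or by the base Layer's public entry points) with the bottom/top collections.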
An interface for the units of computation which can be composed into a Net.
Log m_log
Specifies the Log for output.
LayerParameter m_param
Specifies the LayerParameter describing the Layer.
CudaDnn< T > m_cuda
Specifies the CudaDnn connection to Cuda.
LayerParameter.LayerType m_type
Specifies the Layer type.
LayerParameter layer_param
Returns the LayerParameter for this Layer.
Specifies the parameters for the EltwiseLayer.
EltwiseOp
Defines the operation to perform.
bool allow_single_batch_input
Specifies whether to allow single batch input for the second input (default = false).
List< double > coeff
Specifies the blob-wise coefficient for SUM operation.
bool stable_prod_grad
Specifies whether or not to use an asymptotically slower (for > 2 inputs) but stabler method of compu...
EltwiseOp operation
Specifies the element-wise operation.
bool coeff_blob
If true and the EltwiseOp is SUM, the last bottom blob is a singleton coefficient for the first N-1 b...
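A hedged configuration sketch of these fields (field names from the docs above; the EltwiseOp value is an assumption):

EltwiseParameter ep = p.eltwise_param;
ep.operation = EltwiseParameter.EltwiseOp.PROD;  // assumed enum value
ep.stable_prod_grad = true;   // slower for > 2 inputs, but a stabler gradient
ep.coeff_blob = false;        // no trailing per-sample coefficient blob
ep.allow_single_batch_input = false;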
Specifies the base parameter for all layers.
string name
Specifies the name of this LayerParameter.
EltwiseParameter eltwise_param
Returns the parameter set when initialized with LayerType.ELTWISE
LayerType
Specifies the layer type.
The MyCaffe.basecode contains all generic types used throughout MyCaffe.
The MyCaffe.common namespace contains common MyCaffe classes.
The MyCaffe.layers namespace contains all layers that have a solidified code base,...
The MyCaffe.param namespace contains parameters used to create models.
The MyCaffe namespace contains the main body of MyCaffe code that closely tracks the C++ Caffe open-...