2using System.Collections.Generic;
41 int m_nNumSpatialAxes;
47 bool m_bForceNDIm2Col;
61 m_blobKernelShape =
new Blob<T>(cuda, log);
62 m_blobStride =
new Blob<T>(cuda, log);
63 m_blobPad =
new Blob<T>(cuda, log);
64 m_blobDilation =
new Blob<T>(cuda, log);
70 m_blobKernelShape.Dispose();
102 int nInputNumDims = colBottom[0].shape().
Count;
103 m_nChannelAxis = colBottom[0].CanonicalAxisIndex(p.
axis);
104 int nFirstSpatialDim = m_nChannelAxis + 1;
105 m_nNumSpatialAxes = nInputNumDims - nFirstSpatialDim;
107 m_log.
CHECK_GE(m_nNumSpatialAxes, 1,
"The spatial axis count must be >= 1.");
109 List<int> rgDimBlobShape =
new List<int>() { m_nNumSpatialAxes };
112 m_blobKernelShape.Reshape(rgDimBlobShape);
114 T[] rgKernelShape = m_blobKernelShape.mutable_cpu_data;
118 m_log.
CHECK_EQ(m_nNumSpatialAxes, 2,
"kernel_h & kernel_w can only be used for 2D convolution.");
120 rgKernelShape[0] = (T)Convert.ChangeType(p.
kernel_h.Value, typeof(T));
121 rgKernelShape[1] = (T)Convert.ChangeType(p.
kernel_w.Value, typeof(T));
126 m_log.
CHECK(nNumKernelDims == 1 || nNumKernelDims == m_nNumSpatialAxes,
"kernel_size must be specified once, or once per spatial dimension (kernel_size specified " + nNumKernelDims.ToString() +
" times; " + m_nNumSpatialAxes.ToString() +
" spatial dims);");
128 for (
int i = 0; i < m_nNumSpatialAxes; i++)
130 uint nKernel = p.
kernel_size[(nNumKernelDims == 1) ? 0 : i];
131 rgKernelShape[i] = (T)Convert.ChangeType(nKernel, typeof(T));
135 for (
int i = 0; i < m_nNumSpatialAxes; i++)
137 int nVal = (int)Convert.ChangeType(rgKernelShape[i], typeof(
int));
138 m_log.
CHECK_GT(nVal, 0,
"Filter dimensions must be nonzero.");
141 m_blobKernelShape.mutable_cpu_data = rgKernelShape;
145 m_blobStride.
Reshape(rgDimBlobShape);
151 m_log.
CHECK_EQ(m_nNumSpatialAxes, 2,
"stride_h & stride_w can only be used for 2D convolution.");
152 m_log.
CHECK_EQ(0, p.
stride.Count,
"Either stride or stride_h/w should be specified; not both.");
153 rgStrideData[0] = (T)Convert.ChangeType(p.
stride_h.Value, typeof(T));
154 rgStrideData[1] = (T)Convert.ChangeType(p.
stride_w.Value, typeof(T));
158 int nNumStrideDims = p.
stride.Count;
159 m_log.
CHECK(nNumStrideDims == 0 || nNumStrideDims == 1 || nNumStrideDims == m_nNumSpatialAxes,
"stride must be specified once, or once per spatial dimension (stride specified " + nNumStrideDims.ToString() +
" times; " + m_nNumSpatialAxes.ToString() +
" spatial dims);");
161 uint nDefaultStride = 1;
162 for (
int i = 0; i < m_nNumSpatialAxes; i++)
164 uint nStride = (nNumStrideDims == 0) ? nDefaultStride :
165 p.
stride[(nNumStrideDims == 1) ? 0 : i];
167 rgStrideData[i] = (T)Convert.ChangeType(nStride, typeof(T));
175 m_blobPad.
Reshape(rgDimBlobShape);
181 m_log.
CHECK_EQ(m_nNumSpatialAxes, 2,
"pad_h & pad_w can only be used for 2D convolution.");
182 m_log.
CHECK_EQ(0, p.
pad.Count,
"Either pad or pad_h/w should be specified; not both.");
183 rgPadData[0] = (T)Convert.ChangeType(p.
pad_h.Value, typeof(T));
184 rgPadData[1] = (T)Convert.ChangeType(p.
pad_w.Value, typeof(T));
188 int nNumPadDims = p.
pad.Count;
189 m_log.
CHECK(nNumPadDims == 0 || nNumPadDims == 1 || nNumPadDims == m_nNumSpatialAxes,
"pad must be specified once, or once per spatial dimension (pad specified " + nNumPadDims.ToString() +
" times; " + m_nNumSpatialAxes.ToString() +
" spatial dims);");
191 uint nDefaultPad = 0;
192 for (
int i = 0; i < m_nNumSpatialAxes; i++)
194 uint nPad = (nNumPadDims == 0) ? nDefaultPad :
195 p.
pad[(nNumPadDims == 1) ? 0 : i];
197 rgPadData[i] = (T)Convert.ChangeType(nPad, typeof(T));
205 m_blobDilation.
Reshape(rgDimBlobShape);
209 int nNumDilationDims = p.
dilation.Count;
210 m_log.
CHECK(nNumDilationDims == 0 || nNumDilationDims == 1 || nNumDilationDims == m_nNumSpatialAxes,
"dilation must be specified once, or once per spatial dimension (dilation specified " + nNumDilationDims.ToString() +
" times; " + m_nNumSpatialAxes.ToString() +
" spatial dims);");
212 uint nDefaultDilation = 1;
213 for (
int i = 0; i < m_nNumSpatialAxes; i++)
215 uint nPad = (nNumDilationDims == 0) ? nDefaultDilation :
216 p.
dilation[(nNumDilationDims == 1) ? 0 : i];
218 rgDilationData[i] = (T)Convert.ChangeType(nPad, typeof(T));
231 List<int> rgTopShape =
Utility.Clone<
int>(colBottom[0].shape());
232 T[] rgKernelShapeData = m_blobKernelShape.update_cpu_data();
237 for (
int i = 0; i < m_nNumSpatialAxes; i++)
239 int nKernel =
val_at(rgKernelShapeData, i);
240 int nStride =
val_at(rgStrideData, i);
241 int nPad =
val_at(rgPadData, i);
242 int nDilation =
val_at(rgDilationData, i);
244 rgTopShape[m_nChannelAxis] *= nKernel;
245 int nInputDim = colBottom[0].shape()[m_nChannelAxis + i + 1];
246 int nKernelExtent = nDilation * (nKernel - 1) + 1;
247 int nOutputDim = (nInputDim + 2 * nPad - nKernelExtent) / nStride + 1;
248 rgTopShape[m_nChannelAxis + i + 1] = nOutputDim;
252 m_nNum = colBottom[0].count(0, m_nChannelAxis);
253 m_nBottomDim = colBottom[0].count(m_nChannelAxis);
254 m_nTopDim = colTop[0].count(m_nChannelAxis);
255 m_nChannels = colBottom[0].shape(m_nChannelAxis);
270 long hBottomData = colBottom[0].gpu_data;
271 long hTopData = colTop[0].mutable_gpu_data;
273 if (!m_bForceNDIm2Col && m_nNumSpatialAxes == 2)
275 Size szKernel =
size_at(m_blobKernelShape);
276 Size szStride =
size_at(m_blobStride);
277 Size szPad =
size_at(m_blobPad);
278 Size szDilation =
size_at(m_blobDilation);
280 for (
int n = 0; n < m_nNum; n++)
282 m_cuda.im2col(hBottomData,
285 colBottom[0].shape(m_nChannelAxis + 1),
286 colBottom[0].shape(m_nChannelAxis + 2),
287 szKernel.Height, szKernel.Width,
288 szPad.Height, szPad.Width,
289 szStride.Height, szStride.Width,
290 szDilation.Height, szDilation.Width,
297 int nNumKernels = m_nChannels * colTop[0].count(m_nChannelAxis + 1);
298 long hKernelShape = m_blobKernelShape.gpu_data;
299 long hStride = m_blobStride.
gpu_data;
301 long hDilation = m_blobDilation.
gpu_data;
303 for (
int n = 0; n < m_nNum; n++)
305 m_cuda.im2col_nd(hBottomData,
310 colBottom[0].gpu_shape,
332 long hTopDiff = colTop[0].gpu_diff;
333 long hBottomDiff = colBottom[0].mutable_gpu_diff;
335 if (!m_bForceNDIm2Col && m_nNumSpatialAxes == 2)
337 Size szKernel =
size_at(m_blobKernelShape);
338 Size szStride =
size_at(m_blobStride);
339 Size szPad =
size_at(m_blobPad);
340 Size szDilation =
size_at(m_blobDilation);
342 for (
int n = 0; n < m_nNumSpatialAxes; n++)
347 colBottom[0].shape()[m_nChannelAxis + 1],
348 colBottom[0].shape()[m_nChannelAxis + 2],
349 szKernel.Height, szKernel.Width,
350 szPad.Height, szPad.Width,
351 szStride.Height, szStride.Width,
352 szDilation.Height, szDilation.Width,
359 long hKernelShape = m_blobKernelShape.gpu_data;
360 long hStride = m_blobStride.
gpu_data;
362 long hDilation = m_blobDilation.
gpu_data;
364 for (
int n = 0; n < m_nNumSpatialAxes; n++)
366 m_cuda.col2im_nd(hTopDiff,
371 colBottom[0].gpu_shape,
The Log class provides general output in text form.
void CHECK(bool b, string str)
Test a flag for true.
void CHECK_EQ(double df1, double df2, string str)
Test whether one number is equal to another.
void CHECK_GT(double df1, double df2, string str)
Test whether one number is greater than another.
void CHECK_GE(double df1, double df2, string str)
Test whether one number is greater than or equal to another.
The Utility class provides general utility functions.
The BlobCollection contains a list of Blobs.
int Count
Returns the number of items in the collection.
void Reshape(int[] rgShape)
Reshapes all blobs in the collection to the given shape.
The Blob is the main holder of data that moves through the Layers of the Net.
T[] mutable_cpu_data
Get data from the GPU and bring it over to the host, or Set data from the Host and send it over to th...
void Reshape(int nNum, int nChannels, int nHeight, int nWidth, bool? bUseHalfSize=null)
DEPRECATED; use
T[] update_cpu_data()
Update the CPU data by transferring the GPU data over to the Host.
virtual void Dispose(bool bDisposing)
Releases all resources used by the Blob (including both GPU and Host).
long gpu_data
Returns the data GPU handle used by the CudaDnn connection.
The CudaDnn object is the main interface to the Low-Level Cuda C++ DLL.
The Im2ColLayer is a helper layer for image operations that rearranges image regions into column vect...
override void backward(BlobCollection< T > colTop, List< bool > rgbPropagateDown, BlobCollection< T > colBottom)
Computes the error gradient w.r.t. the forwarded inputs.
override void LayerSetUp(BlobCollection< T > colBottom, BlobCollection< T > colTop)
Setup the layer.
override void Reshape(BlobCollection< T > colBottom, BlobCollection< T > colTop)
Reshape the bottom (input) and top (output) blobs.
Im2colLayer(CudaDnn< T > cuda, Log log, LayerParameter p)
The Im2col constructor.
override void dispose()
Releases all GPU and host resources used by the Layer.
override void forward(BlobCollection< T > colBottom, BlobCollection< T > colTop)
Forward computation.
override int ExactNumTopBlobs
Returns the exact number of required top (output) Blobs: im2col.
override int ExactNumBottomBlobs
Returns the exact number of required bottom (input) Blobs: input.
An interface for the units of computation which can be composed into a Net.
Log m_log
Specifies the Log for output.
LayerParameter m_param
Specifies the LayerParameter describing the Layer.
int val_at(T[] rg, int nIdx)
Returns the integer value at a given index in a generic array.
Size size_at(Blob< T > b)
Returns the Size of a given two element Blob, such as one that stores Blob size information.
CudaDnn< T > m_cuda
Specifies the CudaDnn connection to Cuda.
LayerParameter.LayerType m_type
Specifies the Layer type.
Specifies the parameters for the ConvolutionLayer. The default weight filler is set to the XavierFill...
bool force_nd_im2col
Whether to force use of the general ND convolution, even if a specific implementation for blobs of th...
int axis
The axis to interpret as 'channels' when performing convolution. Preceding dimensions are treated as ...
uint? stride_h
The stride height (2D only)
List< uint > kernel_size
Kernel size is given as a single value for equal dimensions in all spatial dimensions,...
List< uint > dilation
Factor used to dilate the kernel, (implicitly) zero-filling the resulting holes. (Kernel dilation is ...
uint? stride_w
The stride width (2D only)
uint? pad_h
The padding height (2D only)
uint? kernel_h
The kernel height (2D only)
List< uint > stride
Stride is given as a single value for equal dimensions in all spatial dimensions, or once per spatial...
uint? kernel_w
The kernel width (2D only)
uint? pad_w
The padding width (2D only)
List< uint > pad
Pad is given as a single value for equal dimensions in all spatial dimensions, or once per spatial di...
Specifies the base parameter for all layers.
ConvolutionParameter convolution_param
Returns the parameter set when initialized with LayerType.CONVOLUTION
LayerType type
Specifies the type of this LayerParameter.
LayerType
Specifies the layer type.
The MyCaffe.basecode contains all generic types used throughout MyCaffe.
The MyCaffe.common namespace contains common MyCaffe classes.
The MyCaffe.layers namespace contains all layers that have a solidified code base,...
The MyCaffe.param namespace contains parameters used to create models.
The MyCaffe namespace contains the main body of MyCaffe code that closely tracks the C++ Caffe open-...