using System.Collections.Generic;

// Member variable set in the GeluLayer constructor from the layer parameter.
bool m_bEnableBertVersion;
m_bEnableBertVersion = p.gelu_param.enable_bert_version;

// Forward pass: run the GELU CUDA kernel over the bottom blob into the top blob.
long hBottomData = colBottom[0].gpu_data;
long hTopData = colTop[0].mutable_gpu_data;
int nCount = colBottom[0].count();

m_cuda.gelu_fwd(nCount, hBottomData, hTopData, m_bEnableBertVersion);
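The `gelu_fwd` kernel call above selects between two GELU formulations via `m_bEnableBertVersion`. A minimal standalone Python sketch of the math the CUDA kernel is assumed to compute (function names here are illustrative, not part of MyCaffe):

```python
import math

SQRT_2_OVER_PI = math.sqrt(2.0 / math.pi)

def gelu_bert(x):
    # "New GELU" tanh approximation from the BERT/GPT repos
    # (assumed to correspond to enable_bert_version = true).
    return 0.5 * x * (1.0 + math.tanh(SQRT_2_OVER_PI * (x + 0.044715 * x ** 3)))

def gelu_exact(x):
    # Exact GELU via the Gaussian CDF, written with erf.
    return 0.5 * x * (1.0 + math.erf(x / math.sqrt(2.0)))

# The two variants agree closely over typical activation ranges.
for x in (-2.0, -0.5, 0.0, 1.0, 3.0):
    assert abs(gelu_bert(x) - gelu_exact(x)) < 1e-2
print("ok")
```

The tanh form avoids an `erf` evaluation on the GPU, which is why the BERT/GPT repositories favor it.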
// Backward pass: compute the bottom diff from the top data/diff via the CUDA kernel.
long hTopData = colTop[0].gpu_data;
long hTopDiff = colTop[0].gpu_diff;
long hBottomDiff = colBottom[0].mutable_gpu_diff;
long hBottomData = colBottom[0].gpu_data;
int nCount = colBottom[0].count();

m_cuda.gelu_bwd(nCount, hTopDiff, hTopData, hBottomDiff, hBottomData, m_bEnableBertVersion);
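The backward kernel needs the derivative of the chosen GELU form to scale the incoming top diff. A sketch of the tanh-approximation derivative, verified against a central finite difference (again plain Python rather than the actual CUDA code):

```python
import math

SQRT_2_OVER_PI = math.sqrt(2.0 / math.pi)
C = 0.044715

def gelu_bert(x):
    # "New GELU" tanh approximation (forward).
    return 0.5 * x * (1.0 + math.tanh(SQRT_2_OVER_PI * (x + C * x ** 3)))

def gelu_bert_grad(x):
    # d/dx of 0.5 * x * (1 + tanh(u)) by the product and chain rules,
    # with u = sqrt(2/pi) * (x + C*x^3) and tanh'(u) = 1 - tanh(u)^2.
    u = SQRT_2_OVER_PI * (x + C * x ** 3)
    du = SQRT_2_OVER_PI * (1.0 + 3.0 * C * x ** 2)
    t = math.tanh(u)
    return 0.5 * (1.0 + t) + 0.5 * x * (1.0 - t * t) * du

# Check the analytic gradient against a central finite difference.
for x in (-2.0, -0.5, 0.0, 1.0, 3.0):
    eps = 1e-6
    fd = (gelu_bert(x + eps) - gelu_bert(x - eps)) / (2.0 * eps)
    assert abs(gelu_bert_grad(x) - fd) < 1e-4
print("ok")
```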
The Log class provides general output in text form.
The BlobCollection contains a list of Blobs.
The CudaDnn object is the main interface to the Low-Level Cuda C++ DLL.
CudaDnn< T > m_cuda
Specifies the CudaDnn connection to Cuda.
LayerParameter.LayerType m_type
Specifies the Layer type.
The NeuronLayer is an interface for layers that take one blob as input (x) and produce one equally-sized blob as output (y).
The GeluLayer implements the New GELU activation function currently in the Google BERT repo (same as OpenAI GPT).
override void backward(BlobCollection< T > colTop, List< bool > rgbPropagateDown, BlobCollection< T > colBottom)
Computes the error gradient w.r.t. the GELU value inputs.
override void forward(BlobCollection< T > colBottom, BlobCollection< T > colTop)
Computes the forward GELU activation.
GeluLayer(CudaDnn< T > cuda, Log log, LayerParameter p)
The GeluLayer constructor.
Specifies the base parameter for all layers.
LayerType
Specifies the layer type.
GeluParameter gelu_param
Returns the parameter set when initialized with LayerType.GELU
The MyCaffe.basecode namespace contains all generic types used throughout MyCaffe.
The MyCaffe.common namespace contains common MyCaffe classes.
The MyCaffe.layers.gpt namespace contains all GPT related layers.
The MyCaffe.param namespace contains parameters used to create models.
The MyCaffe namespace contains the main body of MyCaffe code that closely tracks the C++ Caffe open-source project.