using System;
using System.Collections.Generic;
using System.Diagnostics;
using System.Threading.Tasks;
List<Tuple<string, Action>> m_rgBackprop = new List<Tuple<string, Action>>();
Dictionary<string, Blob<T>[]> m_rgDebug = new Dictionary<string, Blob<T>[]>();
bool m_bNeedsBackprop = true;
bool m_bCheckForNans = false;
bool m_bClipGradients = false;
bool m_bAddDebug = false;
string m_strMarker = null;
public ComputeGraph(CudaDnn<T> cuda, Log log, int nAxis, bool bNeedsBackprop = true, bool bClipGradients = false, bool bCheckNans = false, bool bAddDebug = false)
{
    m_blobWork = new Blob<T>(cuda, log);
    m_bNeedsBackprop = bNeedsBackprop;
    m_bCheckForNans = bCheckNans;
    m_bClipGradients = bClipGradients;
    m_bAddDebug = bAddDebug;
    // ...
}
// From Dispose():
if (m_blobWork != null)
{
    // ... (elided)
}
private void add_debug(string str, params Blob<T>[] rg)
{
    string strName = m_rgDebug.Count.ToString() + "_" + str;
    m_rgDebug.Add(strName, rg);
}
public Dictionary<string, Blob<T>[]> Debug
{
    get { return m_rgDebug; }
}

public string marker
{
    get { return m_strMarker; }
    set { m_strMarker = value; }
}

public bool needs_backprop
{
    get { return m_bNeedsBackprop; }
    set { m_bNeedsBackprop = value; }
}

public int axis
{
    get { return m_nAxis; }
}

private Blob<T> work
{
    get { return m_blobWork; }
}
private int input_count(Blob<T> b)
{
    if (b.num_axes <= m_nAxis + 2)
    {
        // ... (elided)
    }
    return b.count(m_nAxis + 2);
}
private void clip_gradient1(Blob<T> b)
{
    float[] rg = Utility.ConvertVecF<T>(b.mutable_cpu_diff);
    for (int i = 0; i < rg.Length; i++)
    {
        if (Math.Abs(rg[i]) < 0.000001)
        {
            // ... (elided)
        }
        rg[i] = (float)Math.Round(rg[i], 7);
    }
    // ...
}
private void clip_gradient(params Blob<T>[] rg)
{
    foreach (Blob<T> b in rg)
        clip_gradient1(b);  // per-blob helper shown above
}
private T[] round(T[] rgData1, int nDecimals)
{
    float[] rgData = Utility.ConvertVecF<T>(rgData1);
    for (int i = 0; i < rgData.Length; i++)
        rgData[i] = (float)Math.Round(rgData[i], nDecimals);
    // ... (elided: convert back to T[] and return)
}
private void check_nan(params Blob<T>[] rg)
{
    for (int i = 0; i < rg.Length; i++)
    {
        work.ReshapeLike(rg[i]);
        Tuple<double, double, double, double> data = rg[i].minmax_data(work, true);
        Tuple<double, double, double, double> diff = rg[i].minmax_diff(work, true);
        double dfDataNanCount = data.Item3;
        double dfDataInfCount = data.Item4;
        double dfDiffNanCount = diff.Item3;
        double dfDiffInfCount = diff.Item4;

        if (dfDataNanCount > 0 || dfDataInfCount > 0)
            throw new Exception("NAN or INF detected in " + rg[i].Name + " data!");

        // Bug fix: the second check must test the diff counts, not the data counts again.
        if (dfDiffNanCount > 0 || dfDiffInfCount > 0)
            throw new Exception("NAN or INF detected in " + rg[i].Name + " diff!");
    }
}
private void apply(Blob<T> work, Blob<T> btm)
{
    // Accumulate the gradient staged in 'work' into the bottom blob's diff.
    m_cuda.add(btm.count(), work.gpu_diff, btm.gpu_diff, btm.mutable_gpu_diff);
}
// From DebugOp(params Blob<T>[] rgB):
string strMarker = marker;
Action backward = () =>
{
    string str = "";
    for (int i = 0; i < rgB.Length; i++)
        str += rgB[i].Name + ",";
    str = str.TrimEnd(',');
    Trace.WriteLine("Debugging at " + strMarker + " blobs: " + str);
};
m_rgBackprop.Add(new Tuple<string, Action>(m_strMarker, backward));
// ...
if (m_bNeedsBackprop)
{
    Action backward = () =>
    {
        // ... (elided)
    };
    m_rgBackprop.Add(new Tuple<string, Action>(m_strMarker, backward));
}
// ...
string strMarker = marker;
List<int> rgShape = new List<int>() { 1, 1 };
rgShape[1] = btm.count(m_nAxis + 1);
// ...
int nSpatialDim = btm.count(m_nAxis + 1);
// ...
if (m_bNeedsBackprop)
{
    Action backward = () =>
    {
        // ... (elided)
    };
    m_rgBackprop.Add(new Tuple<string, Action>(m_strMarker, backward));
}
// ...
string strMarker = marker;
int nSpatialDim = btm.count(m_nAxis);
// ...
if (m_bNeedsBackprop)
{
    Action backward = () =>
    {
        // ... (elided)
    };
    m_rgBackprop.Add(new Tuple<string, Action>(m_strMarker, backward));
}
// ...
string strMarker = marker;
int nSpatialDim = btm.count(m_nAxis);
// ...
if (btm.count() == 0)
    top.SetData(0, nSpatialDim * ix, nSpatialDim);
// ...
if (m_bNeedsBackprop)
{
    Action backward = () =>
    {
        // ... (elided)
    };
    m_rgBackprop.Add(new Tuple<string, Action>(m_strMarker, backward));
}
// ...
string strMarker = marker;
// ...
if (m_bNeedsBackprop)
{
    Action backward = () =>
    {
        // ... (elided)
    };
    m_rgBackprop.Add(new Tuple<string, Action>(m_strMarker, backward));
}
// From tanh(btm, top):
string strMarker = marker;
// ...
if (m_bNeedsBackprop)
{
    Action backward = () =>
    {
        work.ReshapeLike(btm);
        // ... (elided)
        if (m_bClipGradients)
        {
            // ... (elided)
        }
        if (m_bAddDebug)
            add_debug(strMarker + " - tanh", btm, top);
    };
    m_rgBackprop.Add(new Tuple<string, Action>(m_strMarker, backward));
}
// From sigmoid(btm, top):
string strMarker = marker;
// ...
if (m_bNeedsBackprop)
{
    Action backward = () =>
    {
        work.ReshapeLike(btm);
        // ... (elided)
        if (m_bClipGradients)
        {
            // ... (elided)
        }
        if (m_bAddDebug)
            add_debug(strMarker + " - sigmoid", btm, top);
    };
    m_rgBackprop.Add(new Tuple<string, Action>(m_strMarker, backward));
}
// From eltmul(btm1, btm2, top):
string strMarker = marker;
// ...
if (m_bNeedsBackprop)
{
    Action backward = () =>
    {
        work.ReshapeLike(btm1);
        // ... (elided)
        work.ReshapeLike(btm2);
        // ... (elided)
        if (m_bClipGradients)
            clip_gradient(btm1, btm2);
        if (m_bCheckForNans)
            check_nan(btm1, btm2);
        if (m_bAddDebug)
            add_debug(strMarker + " - eltmul", btm1, btm2, top);
    };
    m_rgBackprop.Add(new Tuple<string, Action>(m_strMarker, backward));
}
// From scalemul(btm1, btm2, top, nIdx):
string strMarker = marker;
// ...
if (m_bNeedsBackprop)
{
    Action backward = () =>
    {
        work.ReshapeLike(btm1);
        // ... (elided)
        work.ReshapeLike(btm2);
        // ... (elided: fDot computed here)
        work.SetDiff(fDot, nIdx);   // gradient w.r.t. the scalar at 'nIdx'
        // ... (elided)
        if (m_bClipGradients)
            clip_gradient(btm1, btm2);
        if (m_bCheckForNans)
            check_nan(btm1, btm2);
        if (m_bAddDebug)
            add_debug(strMarker + " - scalemul", btm1, btm2, top);
    };
    m_rgBackprop.Add(new Tuple<string, Action>(m_strMarker, backward));
}
// From mul(btm1, btm2, top, bAccumulateGrad):
string strMarker = marker;
int nM = btm1.shape(m_nAxis);
int nN = btm2.count(m_nAxis + 1);
int nK = btm1.count(m_nAxis + 1);
// ...
if (m_bNeedsBackprop)
{
    Action backward = () =>
    {
        // ... (elided gemm calls)
        if (m_bClipGradients)
            clip_gradient(btm1, btm2);
        if (m_bCheckForNans)
            check_nan(btm1, btm2);
        if (m_bAddDebug)
            add_debug(strMarker + " - mul", btm1, btm2, top);
    };
    m_rgBackprop.Add(new Tuple<string, Action>(m_strMarker, backward));
}
// From add(btm1, btm2, top, bAccumulateGrad):
string strMarker = marker;
// ...
if (m_bNeedsBackprop)
{
    Action backward = () =>
    {
        if (!bAccumulateGrad)
        {
            // ... (elided)
        }
        // ... (elided)
        if (m_bClipGradients)
            clip_gradient(btm1, btm2);
        if (m_bCheckForNans)
            check_nan(btm1, btm2);
        if (m_bAddDebug)
            add_debug(strMarker + " - add", btm1, btm2, top);
    };
    m_rgBackprop.Add(new Tuple<string, Action>(m_strMarker, backward));
}
// ...
if (m_bNeedsBackprop)
{
    Action backward = () =>
    {
        // ... (elided)
    };
    m_rgBackprop.Add(new Tuple<string, Action>(m_strMarker, backward));
}
// From softmax(btm, top):
string strMarker = marker;
// ...
int nOuterNum = btm.count(0, m_nAxis);
int nInnerNum = btm.count(m_nAxis + 1);
int nChannels = top.shape(m_nAxis);
int nCount = btm.count();
// ...
work.ReshapeLike(top);
// ...
m_cuda.channel_max(nOuterNum * nInnerNum, nOuterNum, nChannels, nInnerNum, top.gpu_data, work.mutable_gpu_data);
// ... (elided: presumably channel_sub of the per-channel max, then exp)
m_cuda.channel_sum(nOuterNum * nInnerNum, nOuterNum, nChannels, nInnerNum, top.gpu_data, work.mutable_gpu_data);
// ... (elided: presumably channel_div by the per-channel sum)

if (m_bNeedsBackprop)
{
    Action backward = () =>
    {
        work.ReshapeLike(top);
        m_cuda.copy(nCount, top.gpu_diff, work.mutable_gpu_diff);
        // ... (elided: presumably channel_dot of top.diff and top.data into work.data)
        m_cuda.channel_sub(nCount, nOuterNum, nChannels, nInnerNum, work.gpu_data, work.mutable_gpu_diff);
        // ... (elided)
        m_cuda.mul(nCount, work.gpu_diff, top.gpu_data, work.mutable_gpu_diff);
        // ... (elided)
        if (m_bClipGradients)
        {
            // ... (elided)
        }
        if (m_bAddDebug)
            add_debug(strMarker + " - softmax", btm, top);
    };
    m_rgBackprop.Add(new Tuple<string, Action>(m_strMarker, backward));
}
public int BackwardCount
{
    get { return m_rgBackprop.Count; }
}

// From BackwardOne(int nIdx):
m_rgBackprop[nIdx].Item2();

// From Backward(bool bClear = false): replay the recorded actions last-to-first.
for (int i = m_rgBackprop.Count - 1; i >= 0; i--)
    m_rgBackprop[i].Item2();
if (bClear)
    m_rgBackprop.Clear();

// From Clear():
m_rgBackprop.Clear();
// From the Cache<T> constructor:
m_blobCache = new Blob<T>(cuda, log, false);
m_blobCache.Name = "cache";

// From Dispose():
if (m_blobCache != null)
{
    // ... (elided)
}

public void Create(int nCount, List<int> rgItemShape)
{
    List<int> rgShape = new List<int>(rgItemShape);
    rgShape.Insert(0, nCount);
    // ...
}

// From CopyToCache(Blob<T> b, int nAxis):
int nSpatialDim = b.count(nAxis);
// ...
if (m_nCacheIdx >= m_blobCache.num)
    throw new Exception("The cache is full!");

// From CopyFromCache(Blob<T> b, int nAxis):
int nSpatialDim = b.count(nAxis);
// ...
throw new Exception("The cache is empty!");
The Log class provides general output in text form.
The Utility class provides general utility functions.
static List< int > Create(int nCount, int nStart, int nInc)
Create a new List and fill it with values starting with start and incrementing by inc.
static double[] ConvertVec(float[] rgf)
Convert an array of float to an array of double.
The BlobCollection contains a list of Blobs.
The Blob is the main holder of data that moves through the Layers of the Net.
void SetData(T[] rgData, int nCount=-1, bool bSetCount=true)
Sets a number of items within the Blob's data.
long mutable_gpu_diff
Returns the diff GPU handle used by the CudaDnn connection.
T[] mutable_cpu_diff
Get diff from the GPU and bring it over to the host, or Set diff from the Host and send it over to the GPU.
long mutable_gpu_data
Returns the data GPU handle used by the CudaDnn connection.
T[] mutable_cpu_data
Get data from the GPU and bring it over to the host, or Set data from the Host and send it over to the GPU.
void Reshape(int nNum, int nChannels, int nHeight, int nWidth, bool? bUseHalfSize=null)
DEPRECATED; use the List<int>-based Reshape overload instead.
List< int > shape()
Returns an array where each element contains the shape of an axis of the Blob.
static T Zero
Returns Zero (0) in type T.
T GetData(int nIdx)
Returns the data at a given flat index within the Blob.
int count()
Returns the total number of items in the Blob.
void ReshapeLike(Blob< T > b, bool? bUseHalfSize=null)
Reshape this Blob to have the same shape as another Blob.
string Name
Get/set the name of the Blob.
long gpu_diff
Returns the diff GPU handle used by the CudaDnn connection.
virtual void Dispose(bool bDisposing)
Releases all resources used by the Blob (including both GPU and Host).
void SetDiff(double dfVal, int nIdx=-1)
Either sets all of the diff items in the Blob to a given value, or alternatively only sets a single item at the given index.
int num
DEPRECATED; legacy shape accessor num: use shape(0) instead.
long gpu_data
Returns the data GPU handle used by the CudaDnn connection.
The Cache class is used to cache blobs over time.
void CopyFromCache(Blob< T > b, int nAxis)
Copies a value from the current location in the cache to the blob.
Cache(CudaDnn< T > cuda, Log log)
The constructor.
void Dispose()
Release any resources used.
void Reset()
Resets the cache.
void CopyToCache(Blob< T > b, int nAxis)
Copies a blob to the current location in the cache.
void Create(int nCount, List< int > rgItemShape)
Create the cache memory.
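A minimal usage sketch of the Cache API documented above; the step count, item shape and blob name are illustrative assumptions:

    // Hypothetical: store a hidden-state blob once per time step.
    Cache<float> cache = new Cache<float>(cuda, log);
    cache.Create(nSteps, new List<int>() { 1, nHidden });  // one cache slot per step
    cache.CopyToCache(blobHidden, 1);    // write the current state at the cache position
    cache.Reset();                       // reset the cache position
    cache.CopyFromCache(blobHidden, 1);  // read the cached state back out
    cache.Dispose();                     // release GPU resources when done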
The ComputeGraph class provides a simple computation graph of operations used in a forward pass that are then played back in reverse order to implement the backward pass.
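Below is a minimal usage sketch; the blob names and the axis value are illustrative assumptions, not taken from the library:

    // Record forward ops; each one queues its own backward Action.
    ComputeGraph<float> g = new ComputeGraph<float>(cuda, log, 1);  // ops run on axis 1
    g.marker = "step1";              // tag subsequent ops in debug output
    g.mul(blobA, blobB, blobC);      // C = A x B (gemm); backward Action recorded
    g.softmax(blobC, blobD);         // forward softmax; backward Action recorded
    g.Backward(true);                // replay recorded Actions last-to-first, then clear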
Blob< T > mul(Blob< T > btm1, Blob< T > btm2, Blob< T > top, bool bAccumulateGrad=true)
'mul' operation performs a blas gemm operation on the 'btm1' matrix with the 'btm2' matrix and places the results in 'top'.
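Given the nM/nN/nK values computed in the source listing above, the whole operation plausibly reduces to three gemm calls; this sketch applies the standard matrix-product gradient rules and is an assumption rather than the library's verbatim code:

    // Forward: top = btm1 x btm2, with btm1 of shape (nM x nK) and btm2 of shape (nK x nN).
    m_cuda.gemm(false, false, nM, nN, nK, 1.0, btm1.gpu_data, btm2.gpu_data, 0.0, top.mutable_gpu_data);
    // Backward: d(btm1) += d(top) x btm2^T and d(btm2) += btm1^T x d(top);
    // beta = 1.0 accumulates into the existing diff, matching bAccumulateGrad = true.
    m_cuda.gemm(false, true, nM, nK, nN, 1.0, top.gpu_diff, btm2.gpu_data, 1.0, btm1.mutable_gpu_diff);
    m_cuda.gemm(true, false, nK, nN, nM, 1.0, btm1.gpu_data, top.gpu_diff, 1.0, btm2.mutable_gpu_diff);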
void DebugOp(params Blob< T >[] rgB)
DebugOp operation places a debug stub in the backpropagation chain for debugging only.
void CopyToCache(Blob< T > btm, Cache< T > cache)
CopyToCache operation copies the blob into the cache.
Blob< T > clear_grad(Blob< T > b)
'clear_grad' operation only runs on the backward pass and zeros out the gradients on an input.
void PeekItem(Blob< T > btm, Blob< T > top, int ix)
PeekItem operation copies a single item from the bottom to the top.
Blob< T > add(Blob< T > btm1, Blob< T > btm2, Blob< T > top, bool bAccumulateGrad=true)
'add' operation adds each element of 'btm1' to 'btm2' and places the results in 'top'.
Dictionary< string, Blob< T >[]> Debug
Returns a dictionary of Blobs used during each operation, only filled when 'bAddDebug' = true in the constructor.
void Clear()
Clears all backward operations from the list.
int BackwardCount
Returns the backward operation count.
Blob< T > sigmoid(Blob< T > btm, Blob< T > top)
'sigmoid' operation runs the sigmoid on each item in the btm and places the results in the top.
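The body of the backward Action is elided in the source listing above, but it presumably wraps sigmoid_bwd (documented below), which applies the standard rule d(bottom) = d(top) * y * (1 - y) for y = sigmoid(x). A sketch, not verbatim source:

    work.ReshapeLike(btm);  // stage the gradient in the work blob
    m_cuda.sigmoid_bwd(btm.count(), top.gpu_diff, top.gpu_data, work.mutable_gpu_diff);
    apply(work, btm);       // accumulate work.diff into btm.diff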
Blob< T > CopyToRow(Blob< T > btm, Blob< T > top, int ix, bool bCopyDiff=false)
CopyToRow operation copies the bottom vector into the top matrix.
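A hypothetical way to combine CopyToRow with PeekRow when assembling a sequence matrix one step at a time (the blob names and nSteps are invented; 'g' is the hypothetical graph from the earlier sketch):

    // Scatter per-step vectors into rows of a sequence matrix, then read one back.
    for (int t = 0; t < nSteps; t++)
        g.CopyToRow(blobStep, blobSeq, t);   // write the step vector into row t
    g.PeekRow(blobSeq, blobRow, 2);          // read row 2 (data and diff) back out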
void clear_grad(BlobCollection< T > rg)
'clear_grad' operation only runs on the backward pass and zeros out the gradients of the inputs.
void Backward(bool bClear=false)
Runs a backward operation on all items starting from the last and running through the first.
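The same chain can be stepped manually with BackwardCount and BackwardOne, which is useful when isolating a single failing operation (again using the hypothetical graph 'g'):

    for (int i = g.BackwardCount - 1; i >= 0; i--)
        g.BackwardOne(i);   // run one recorded backward Action, newest first
    g.Clear();              // same effect as passing bClear = true to Backward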
string marker
Get/set a string marker added to the debug information and used to indicate where in the code a given operation takes place.
Blob< T > Round(Blob< T > b, int nDecimals=6)
Round operation, rounds the values to the nearest specified decimal.
Blob< T > tanh(Blob< T > btm, Blob< T > top)
'tanh' operation runs the tanh on each item in the btm and places the results in the top.
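As with sigmoid, the recorded backward Action presumably delegates to tanh_bwd (documented below), which implements d(bottom) = d(top) * (1 - y^2) for y = tanh(x). A sketch only:

    work.ReshapeLike(btm);
    m_cuda.tanh_bwd(btm.count(), top.gpu_diff, top.gpu_data, work.mutable_gpu_diff);
    apply(work, btm);   // accumulate the staged gradient into btm.diff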
Blob< T > eltmul(Blob< T > btm1, Blob< T > btm2, Blob< T > top)
'eltmul' operation multiplies each element of 'btm1' with 'btm2' and places the results in 'top'.
Blob< T > softmax(Blob< T > btm, Blob< T > top)
'softmax' operation runs the softmax on each item in the btm and places the results in the top.
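The channel_* calls in the source listing implement the numerically stable form of softmax. Forward, per channel: y_i = exp(x_i - max_j x_j) / sum_j exp(x_j - max_j x_j), which is why channel_max runs before the elided channel_sub/exp and channel_sum/channel_div steps. Backward, the copy, channel_sub and mul sequence computes the standard softmax gradient d(x_i) = y_i * (d(y_i) - sum_j d(y_j) * y_j), with the per-channel dot product sum_j d(y_j) * y_j presumably produced by channel_dot in the elided lines.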
ComputeGraph(CudaDnn< T > cuda, Log log, int nAxis, bool bNeedsBackprop=true, bool bClipGradients=false, bool bCheckNans=false, bool bAddDebug=false)
The constructor.
void BackwardOne(int nIdx)
Runs a backward operation at a given index.
Blob< T > scalemul(Blob< T > btm1, Blob< T > btm2, Blob< T > top, int nIdx=0)
'scalemul' operation multiplies each element of 'btm1' with the first item within 'btm2' and places the results in 'top'.
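The work.SetDiff(fDot, nIdx) call in the source listing matches the standard gradient for scaling by a scalar s = btm2[nIdx]: the scalar's gradient is the dot product d(s) = sum_i d(top_i) * btm1_i (presumably the fDot value produced by dot_float), while each element gradient is d(btm1_i) = s * d(top_i).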
void Dispose()
Release all resources used.
bool needs_backprop
Get/set whether or not to back propagate.
int axis
Returns the axis on which all operations are performed.
Blob< T > PeekRow(Blob< T > btm, Blob< T > top, int ix)
PeekRow operation copies data and diffs from one row within the bottom matrix and places it in the top vector.
The CudaDnn object is the main interface to the Low-Level Cuda C++ DLL.
void copy(int nCount, long hSrc, long hDst, int nSrcOffset=0, int nDstOffset=0, long hStream=-1, bool? bSrcHalfSizeOverride=null, bool? bDstHalfSizeOverride=null)
Copy data from one block of GPU memory to another.
void channel_sub(int nCount, int nOuterNum, int nChannels, int nInnerNum, long hA, long hX, long hY)
Subtracts the values across the channels of X from A and places the result in Y.
void tanh_fwd(int nCount, long hBottomData, long hTopData)
Performs a TanH forward pass in Cuda.
void channel_dot(int nCount, int nOuterNum, int nChannels, int nInnerNum, long hX, long hA, long hY)
Calculates the dot product of the values within each channel of X and places the result in Y.
void add(int n, long hA, long hB, long hC, long hY)
Adds A, B and C and places the result in Y.
void channel_max(int nCount, int nOuterNum, int nChannels, int nInnerNum, long hX, long hY, bool bReturnIdx=false)
Calculates the maximum value within each channel of X and places the result in Y.
void sigmoid_fwd(int nCount, long hBottomData, long hTopData)
Performs a Sigmoid forward pass in Cuda.
void gemm(bool bTransA, bool bTransB, int m, int n, int k, double fAlpha, long hA, long hB, double fBeta, long hC)
Perform a matrix-matrix multiplication operation: C = alpha * transA(A) * transB(B) + beta * C
void scale(int n, double fAlpha, long hX, long hY)
Scales the values in X and places them in Y.
void exp(int n, long hA, long hY)
Calculates the exponential of the values in A and places the result in Y.
void channel_sum(int nCount, int nOuterNum, int nChannels, int nInnerNum, long hX, long hY, bool bSumAcrossChannels=true, DIR dir=DIR.FWD, int nChannelsY=-1)
Calculates the sum of the values either across or within each channel (depending on bSumAcrossChannels) of X and places the result in Y.
float dot_float(int n, long hX, long hY)
Computes the dot product of X and Y.
void mul(int n, long hA, long hB, long hY, int nAOff=0, int nBOff=0, int nYOff=0)
Multiplies each element of A with each element of B and places the result in Y.
void channel_div(int nCount, int nOuterNum, int nChannels, int nInnerNum, long hX, long hY, int nMethod=1)
Divides the values of the channels from X and places the result in Y.
void sigmoid_bwd(int nCount, long hTopDiff, long hTopData, long hBottomDiff)
Performs a Sigmoid backward pass in Cuda.
void tanh_bwd(int nCount, long hTopDiff, long hTopData, long hBottomDiff)
Performs a TanH backward pass in Cuda.
The MyCaffe.basecode contains all generic types used throughout MyCaffe.
The MyCaffe.common namespace contains common MyCaffe classes.
The MyCaffe namespace contains the main body of MyCaffe code that closely tracks the C++ Caffe open-source project.