using System.Collections.Generic;
using System.Threading.Tasks;
m_icallback = icallback;
m_properties = properties;

private void wait(int nWait)
while (nTotalWait < nWait)
{
    m_icallback.OnWait(new WaitArgs(nWaitInc));
    nTotalWait += nWaitInc;
}

if (m_mycaffe != null)
    m_icallback.OnShutdown();
Agent<T> agent = new Agent<T>(m_icallback, m_mycaffe, m_properties, m_random, Phase.TRAIN);

Agent<T> agent = new Agent<T>(m_icallback, m_mycaffe, m_properties, m_random, Phase.RUN);
byte[] rgResults = agent.Run(nN, out type);

string strProp = m_properties.ToString();
strProp += "EnableNumSkip=False;";

Agent<T> agent = new Agent<T>(m_icallback, m_mycaffe, properties, m_random, Phase.TRAIN);

Agent<T> agent = new Agent<T>(m_icallback, m_mycaffe, m_properties, m_random, Phase.TRAIN);
agent.Run(Phase.TRAIN, nN, type, step);
class Agent<T> : IDisposable

bool m_bAllowDiscountReset = false;
bool m_bUseRawInput = false;

m_icallback = icallback;
m_brain = new Brain<T>(mycaffe, properties, random, phase);
m_properties = properties;
m_bAllowDiscountReset = properties.GetPropertyAsBool("AllowDiscountReset", false);

public void Dispose()
private StateBase getData(Phase phase, int nAction)
GetDataArgs args = m_brain.getDataArgs(phase, nAction);
m_icallback.OnGetData(args);
return args.State;

private void updateStatus(int nIteration, int nEpisodeCount, double dfRewardSum, double dfRunningReward)
GetStatusArgs args = new GetStatusArgs(0, nIteration, nEpisodeCount, 1000000, dfRunningReward, dfRewardSum, 0, 0, 0, 0);
m_icallback.OnUpdateStatus(args);
public byte[] Run(int nIterations, out string type)
IxTrainerCallbackRNN icallback = m_icallback as IxTrainerCallbackRNN;
if (icallback == null)
    throw new Exception("The Run method requires an IxTrainerCallbackRNN interface to convert the results into the native format!");

StateBase s = getData(Phase.RUN, -1);
List<float> rgResults = new List<float>();

while (!m_brain.Cancel.WaitOne(0) && (nIterations == -1 || nIteration < nIterations))

SimpleDatum x = m_brain.Preprocess(s, m_bUseRawInput);
int action = m_brain.act(x, s.Clip, out rgfAprob);

rgResults.Add(s.Data.TimeStamp.ToFileTime());
rgResults.Add((float)s.Data.GetDataAtF(0));
rgResults.Add(action);

StateBase s_ = getData(Phase.RUN, action);

ConvertOutputArgs args = new ConvertOutputArgs(nIterations, rgResults.ToArray());
icallback.OnConvertOutput(args);
return args.RawOutput;
private bool isAtIteration(int nN, ITERATOR_TYPE type, int nIteration, int nEpisode)

MemoryCollection m_rgMemory = new MemoryCollection();
double? dfRunningReward = null;
double dfEpisodeReward = 0;

StateBase s = getData(phase, -1);
while (!m_brain.Cancel.WaitOne(0) && !isAtIteration(nN, type, nIteration, nEpisode))

SimpleDatum x = m_brain.Preprocess(s, m_bUseRawInput);
int action = m_brain.act(x, s.Clip, out rgfAprob);

StateBase s_ = getData(phase, action);
dfEpisodeReward += s_.Reward;

if (phase == Phase.TRAIN)
    m_rgMemory.Add(new MemoryItem(s, x, action, rgfAprob, (float)s_.Reward));

m_brain.Reshape(m_rgMemory);

float[] rgDiscountedR = m_rgMemory.GetDiscountedRewards(m_fGamma, m_bAllowDiscountReset);
m_brain.SetDiscountedR(rgDiscountedR);

float[] rgfAprobSet = m_rgMemory.GetActionProbabilities();
m_brain.SetActionProbabilities(rgfAprobSet);

float[] rgfAonehotSet = m_rgMemory.GetActionOneHotVectors();
m_brain.SetActionOneHotVectors(rgfAonehotSet);

List<Datum> rgData = m_rgMemory.GetData();
List<Datum> rgClip = m_rgMemory.GetClip();
m_brain.SetData(rgData, rgClip);
m_brain.Train(nIteration, step);

if (!dfRunningReward.HasValue)
    dfRunningReward = dfEpisodeReward;
else
    dfRunningReward = dfRunningReward * 0.99 + dfEpisodeReward * 0.01;

updateStatus(nIteration, nEpisode, dfEpisodeReward, dfRunningReward.Value);
s = getData(phase, -1);
if (!dfRunningReward.HasValue)
    dfRunningReward = dfEpisodeReward;
else
    dfRunningReward = dfRunningReward * 0.99 + dfEpisodeReward * 0.01;

updateStatus(nIteration, nEpisode, dfEpisodeReward, dfRunningReward.Value);
s = getData(phase, -1);
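// Both branches above maintain the same statistic: the first completed
// episode seeds the running reward, and each later episode blends in at
// one percent. A minimal standalone sketch of that smoothing (the
// 'episodeRewards' sequence is hypothetical):
double? runningReward = null;
foreach (double episodeReward in episodeRewards)
{
    runningReward = runningReward.HasValue
        ? runningReward.Value * 0.99 + episodeReward * 0.01
        : episodeReward;
}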
class Brain<T> : IDisposable

MyCaffeControl<T> m_mycaffe;
bool m_bSoftmaxCeSetup = false;
int m_nMiniBatch = 10;
int m_nRecurrentSequenceLength = 0;
List<Datum> m_rgData = null;
List<Datum> m_rgClip = null;

m_net = mycaffe.GetInternalNet(phase);
m_solver = mycaffe.GetInternalSolver();
m_properties = properties;

if (m_memData == null)
    throw new Exception("Could not find the MemoryData Layer!");

if (m_memLoss == null)
    throw new Exception("Could not find the MemoryLoss Layer!");
m_memLoss.OnGetLoss += memLoss_OnGetLoss;

m_blobDiscountedR = new Blob<T>(mycaffe.Cuda, mycaffe.Log);
m_blobPolicyGradient = new Blob<T>(mycaffe.Cuda, mycaffe.Log);
m_blobActionOneHot = new Blob<T>(mycaffe.Cuda, mycaffe.Log);
m_blobDiscountedR1 = new Blob<T>(mycaffe.Cuda, mycaffe.Log);
m_blobPolicyGradient1 = new Blob<T>(mycaffe.Cuda, mycaffe.Log);
m_blobActionOneHot1 = new Blob<T>(mycaffe.Cuda, mycaffe.Log);
m_blobLoss = new Blob<T>(mycaffe.Cuda, mycaffe.Log);
m_blobAprobLogit = new Blob<T>(mycaffe.Cuda, mycaffe.Log);

if (m_softmax != null)

m_colAccumulatedGradients.SetDiff(0);

int nMiniBatch = mycaffe.CurrentProject.GetBatchSize(phase);
m_nMiniBatch = nMiniBatch;
private void dispose(ref Blob<T> b)

public void Dispose()
m_memLoss.OnGetLoss -= memLoss_OnGetLoss;
dispose(ref m_blobDiscountedR);
dispose(ref m_blobPolicyGradient);
dispose(ref m_blobActionOneHot);
dispose(ref m_blobDiscountedR1);
dispose(ref m_blobPolicyGradient1);
dispose(ref m_blobActionOneHot1);
dispose(ref m_blobLoss);
dispose(ref m_blobAprobLogit);

if (m_colAccumulatedGradients != null)
{
    m_colAccumulatedGradients.Dispose();
    m_colAccumulatedGradients = null;
}

public int RecurrentSequenceLength
get { return m_nRecurrentSequenceLength; }
public int Reshape(MemoryCollection col)
int nNum = col.Count;
int nChannels = col[0].Data.Channels;
int nHeight = col[0].Data.Height;
int nWidth = col[0].Data.Width;
int nActionProbs = 1;

nActionProbs = Math.Max(nCh, nActionProbs);

throw new Exception("Could not find a non-loss output! Your model should output the loss and the action probabilities.");

m_blobDiscountedR.Reshape(nNum, nActionProbs, 1, 1);
m_blobPolicyGradient.Reshape(nNum, nActionProbs, 1, 1);
m_blobActionOneHot.Reshape(nNum, nActionProbs, 1, 1);
m_blobDiscountedR1.Reshape(nNum, nActionProbs, 1, 1);
m_blobPolicyGradient1.Reshape(nNum, nActionProbs, 1, 1);
m_blobActionOneHot1.Reshape(nNum, nActionProbs, 1, 1);
m_blobLoss.Reshape(1, 1, 1, 1);
public void SetDiscountedR(float[] rg)
double dfMean = m_blobDiscountedR.mean(rg);
double dfStd = m_blobDiscountedR.std(dfMean, rg);
int nC = m_blobDiscountedR.channels;

List<float> rgR = new List<float>();

for (int i = 0; i < rg.Length; i++)
    for (int j = 0; j < nC; j++)
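// SetDiscountedR centers and scales the returns before loading them on
// the GPU; blob.mean and blob.std above supply the statistics, and the
// inner loop replicates each return across the nC action channels. A CPU
// sketch of the same normalization, assuming plain arrays and LINQ:
float fMean = rg.Average();
float fStd = (float)Math.Sqrt(rg.Select(v => (v - fMean) * (v - fMean)).Average());
float[] rgNormalized = rg.Select(v => (v - fMean) / fStd).ToArray();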
public void SetActionProbabilities(float[] rg)

public void SetActionOneHotVectors(float[] rg)

public void SetData(List<Datum> rgData, List<Datum> rgClip)
if (m_nRecurrentSequenceLength != 1 && rgData.Count > 1 && rgClip != null)
public GetDataArgs getDataArgs(Phase phase, int nAction)
bool bReset = (nAction == -1);
return new GetDataArgs(phase, 0, m_mycaffe, m_mycaffe.Log, m_mycaffe.CancelEvent, bReset, nAction, true);
get { return m_mycaffe.Log; }

public SimpleDatum Preprocess(StateBase s, bool bUseRawInput)

if (m_sdLast == null)
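// The m_sdLast check above is the heart of Preprocess: unless raw input
// is requested, each frame has the previous frame subtracted so the
// policy sees motion rather than a static screen. A hedged
// reconstruction of the surrounding logic (the copy constructor and
// exact control flow are assumptions; Sub and Zero are SimpleDatum APIs):
SimpleDatum sd = new SimpleDatum(s.Data, true); // assumed copy constructor
if (!bUseRawInput)
{
    if (m_sdLast == null)
        sd.Zero();        // first frame: nothing to difference against
    else
        sd.Sub(m_sdLast); // difference frame: this = this - last
}
m_sdLast = s.Data;
return sd;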
List<Datum> rgData = new List<Datum>();
rgData.Add(new Datum(sd));

List<Datum> rgClip = null;

rgClip = new List<Datum>();
rgClip.Add(new Datum(sdClip));

for (int i = 0; i < res.Count; i++)

if (m_nRecurrentSequenceLength > 1 && res[i].num > 1)
{
    int nCount = res[i].count();
    int nOutput = nCount / res[i].num;
    nStart = nCount - nOutput;

    if (nStart < 0)
        throw new Exception("The start must be zero or greater!");
}

rgfAprob = Utility.ConvertVecF<T>(res[i].update_cpu_data(), nStart);

if (rgfAprob == null)
    throw new Exception("Could not find a non-loss output! Your model should output the loss and the action probabilities.");

for (int i = 0; i < rgfAprob.Length; i++)

if (rgfAprob.Length == 1)

return rgfAprob.Length - 1;
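// The trailing fragments show how act() turns the probability vector
// into an action: a uniform draw is walked through the cumulative
// probabilities (the single-output case is a binary policy handled
// separately), and the final return guards against floating-point
// rounding. A minimal reconstruction under those assumptions:
double dfRand = m_random.NextDouble(); // CryptoRandom, per the trainer
float fSum = 0;
for (int i = 0; i < rgfAprob.Length; i++)
{
    fSum += rgfAprob[i];
    if (dfRand <= fSum)
        return i;
}
return rgfAprob.Length - 1; // probabilities may sum to slightly under 1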
int nCount = dst.count();
dst.CopyFrom(src, nIdx * nCount, 0, nCount, true, false);

public void Train(int nIteration, TRAIN_STEP step)
m_mycaffe.Log.Enable = false;

if (m_nRecurrentSequenceLength != 1 && m_rgData != null && m_rgData.Count > 1 && m_rgClip != null)
prepareBlob(m_blobActionOneHot1, m_blobActionOneHot);
prepareBlob(m_blobDiscountedR1, m_blobDiscountedR);
prepareBlob(m_blobPolicyGradient1, m_blobPolicyGradient);

for (int i = 0; i < m_rgData.Count; i++)
{
    copyBlob(i, m_blobActionOneHot1, m_blobActionOneHot);
    copyBlob(i, m_blobDiscountedR1, m_blobDiscountedR);
    copyBlob(i, m_blobPolicyGradient1, m_blobPolicyGradient);

    List<Datum> rgData1 = new List<Datum>() { m_rgData[i] };
    List<Datum> rgClip1 = new List<Datum>() { m_rgClip[i] };

    m_solver.Step(1, step, true, false, true, true);
}

m_blobActionOneHot.ReshapeLike(m_blobActionOneHot1);
m_blobPolicyGradient.ReshapeLike(m_blobPolicyGradient1);

m_solver.Step(1, step, true, false, true, true);

m_colAccumulatedGradients.SetDiff(0);

m_mycaffe.Log.Enable = true;
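// Step is invoked with updates disabled (per the Solver.Step signature,
// the arguments after 'step' are bZeroDiffs, bApplyUpdates,
// bDisableOutput, bDisableProgress), so Train() accumulates diffs and
// applies them once per mini-batch to emulate a larger batch. A hedged
// sketch of that pattern (the exact wiring inside Train() is assumed):
m_solver.Step(1, step, true, false, true, true); // forward/backward, no update
m_colAccumulatedGradients.Accumulate(m_mycaffe.Cuda, m_net.learnable_parameters, true);

if (nIteration % m_nMiniBatch == 0)
{
    m_solver.ApplyUpdate(nIteration);     // apply the summed gradients
    m_colAccumulatedGradients.SetDiff(0); // reset for the next mini-batch
}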
private T[] unpackLabel(Datum d)

List<int> rgDataShape = e.Data.shape();
List<int> rgClipShape = e.Clip.shape();
List<int> rgLabelShape = e.Label.shape();

int nSeqLen = rgDataShape[0];
e.Data.Log.CHECK_GT(nSeqLen, 0, "The sequence length must be greater than zero!");
e.Data.Log.CHECK_EQ(nBatch, e.ClipItems.Count, "The data and clip should have the same number of items.");
e.Data.Log.CHECK_EQ(nSeqLen, rgClipShape[0], "The data and clip should have the same sequence count.");

rgDataShape[1] = nBatch;
rgClipShape[1] = nBatch;
rgLabelShape[1] = nBatch;
e.Data.Reshape(rgDataShape);
e.Clip.Reshape(rgClipShape);
e.Label.Reshape(rgLabelShape);

T[] rgRawData = new T[e.Data.count()];
T[] rgRawClip = new T[e.Clip.count()];
T[] rgRawLabel = new T[e.Label.count()];

int nDataSize = e.Data.count(2);
T[] rgDataItem = new T[nDataSize];
for (int i = 0; i < nBatch; i++)

T[] rgLabel = unpackLabel(data);

for (int j = 0; j < nSeqLen; j++)

dfClip = clip.GetDataAt<T>(j);

for (int k = 0; k < nDataSize; k++)
    rgDataItem[k] = data.GetDataAt<T>(j * nDataSize + k);

// sequence-major ordering (one branch of the original listing):
nIdx = nBatch * j + i;
// batch-major ordering (the alternative branch):
nIdx = i * nBatch + j;

Array.Copy(rgDataItem, 0, rgRawData, nIdx * nDataSize, nDataSize);
rgRawClip[nIdx] = dfClip;

if (rgLabel.Length == nSeqLen)
    rgRawLabel[nIdx] = rgLabel[j];
else if (rgLabel.Length == 1)
{
    if (j == nSeqLen - 1)
        rgRawLabel[0] = rgLabel[0];
}
else
    throw new Exception("The Solver SequenceLength parameter does not match the actual sequence length! The label length '" + rgLabel.Length.ToString() + "' must be either '1' for SINGLE labels, or the sequence length of '" + nSeqLen.ToString() + "' for MULTI labels. Stopping training.");
e.Data.mutable_cpu_data = rgRawData;
e.Clip.mutable_cpu_data = rgRawClip;
e.Label.mutable_cpu_data = rgRawLabel;
m_nRecurrentSequenceLength = nSeqLen;
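// The handler above repacks the per-item Datums into the single ordered
// tensor a recurrent layer expects; which index formula applies depends
// on the LSTM layer type. An illustration of the sequence-major case
// with hypothetical sizes nBatch = 2, nSeqLen = 3:
for (int j = 0; j < 3; j++)     // time steps
    for (int i = 0; i < 2; i++) // batch items
        Console.WriteLine("slot " + (2 * j + i) + " <- item " + i + ", step " + j);
// Every time step stores all batch items contiguously, which is the
// layout the LSTM consumes.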
int nCount = m_blobPolicyGradient.count();
long hActionOneHot = m_blobActionOneHot.gpu_data;

long hDiscountedR = m_blobDiscountedR.gpu_data;

int nDataSize = e.Bottom[0].count(1);
bool bUsingEndData = false;
if (m_nRecurrentSequenceLength > 1)
{
    List<int> rgShape = e.Bottom[0].shape();

    e.Bottom[0].Reshape(rgShape);
    e.Bottom[0].CopyFrom(m_blobAprobLogit, (m_blobAprobLogit.num - 1) * nDataSize, 0, nDataSize, true, true);
    bUsingEndData = true;
}
long hBottomDiff = e.Bottom[0].mutable_gpu_diff;

if (m_softmax != null)

colBottom.Add(m_blobActionOneHot);
colTop.Add(m_blobLoss);
colTop.Add(m_blobPolicyGradient);

if (!m_bSoftmaxCeSetup)
{
    m_softmaxCe.Setup(colBottom, colTop);
    m_bSoftmaxCeSetup = true;
}

dfLoss = m_softmaxCe.Forward(colBottom, colTop);
m_softmaxCe.Backward(colTop, new List<bool>() { true, false }, colBottom);
hPolicyGrad = colBottom[0].gpu_diff;

m_mycaffe.Cuda.add_scalar(nCount, -1.0, hActionOneHot);
m_mycaffe.Cuda.abs(nCount, hActionOneHot, hActionOneHot);
m_mycaffe.Cuda.mul_scalar(nCount, -1.0, hPolicyGrad);
m_mycaffe.Cuda.add(nCount, hActionOneHot, hPolicyGrad, hPolicyGrad);

m_mycaffe.Cuda.mul_scalar(nCount, -1.0, hPolicyGrad);

m_mycaffe.Cuda.mul(nCount, hPolicyGrad, hDiscountedR, hPolicyGrad);

if (hPolicyGrad != hBottomDiff)
    m_mycaffe.Cuda.copy(nCount, hPolicyGrad, hBottomDiff);
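// Taken together, the kernel calls above implement the standard
// REINFORCE modulation: the softmax cross-entropy diff yields
// (aprob - onehot), and multiplying by the normalized discounted return
// scales each step's gradient by how good its eventual outcome was. An
// equivalent CPU sketch (array names are illustrative):
for (int i = 0; i < nCount; i++)
    rgPolicyGrad[i] = (rgfAprob[i] - rgActionOneHot[i]) * rgDiscountedR[i];
// Actions followed by above-average returns are pushed up; the rest are
// pushed down.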
if (m_nRecurrentSequenceLength > 1 && bUsingEndData)
{
    m_blobAprobLogit.CopyFrom(e.Bottom[0], 0, (m_blobAprobLogit.num - 1) * nDataSize, nDataSize, false, true);
    e.Bottom[0].CopyFrom(m_blobAprobLogit, false, true);
    e.Bottom[0].CopyFrom(m_blobAprobLogit, true);
}
public MemoryCollection()

public float[] GetDiscountedRewards(float fGamma, bool bAllowReset)
{
    float fRunningAdd = 0;
    float[] rgR = m_rgItems.Select(p => p.Reward).ToArray();
    float[] rgDiscountedR = new float[rgR.Length];

    for (int t = Count - 1; t >= 0; t--)
    {
        if (bAllowReset && rgR[t] != 0)
            fRunningAdd = 0;

        fRunningAdd = fRunningAdd * fGamma + rgR[t];
        rgDiscountedR[t] = fRunningAdd;
    }

    return rgDiscountedR;
}
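// The recurrence runs backwards, so each step receives
// r[t] + fGamma * R[t+1], and the reset isolates each scored rally
// (the Pong-style convention that a non-zero reward ends a game).
// Worked usage with fGamma = 0.99 and rewards [0, 0, 1]:
//   t=2: reset, then 0 * 0.99f + 1 = 1.0f
//   t=1: 1.0f * 0.99f + 0 = 0.99f
//   t=0: 0.99f * 0.99f + 0 = 0.9801f
float[] rgDiscounted = memory.GetDiscountedRewards(0.99f, true); // 'memory' is illustrative
// rgDiscounted => { 0.9801f, 0.99f, 1.0f }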
public float[] GetActionProbabilities()
{
    List<float> rgfAprob = new List<float>();

    for (int i = 0; i < m_rgItems.Count; i++)
    {
        rgfAprob.AddRange(m_rgItems[i].Aprob);
    }

    return rgfAprob.ToArray();
}

public float[] GetActionOneHotVectors()
{
    List<float> rgfAonehot = new List<float>();

    for (int i = 0; i < m_rgItems.Count; i++)
    {
        float[] rgfOneHot = new float[m_rgItems[0].Aprob.Length];

        if (rgfOneHot.Length == 1)
            rgfOneHot[0] = m_rgItems[i].Action;
        else
            rgfOneHot[m_rgItems[i].Action] = 1;

        rgfAonehot.AddRange(rgfOneHot);
    }

    return rgfAonehot.ToArray();
}
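// Each chosen action becomes one appended row. For example:
float[] rgfThreeAction = new float[3];
rgfThreeAction[2] = 1;   // agent chose action 2 -> { 0, 0, 1 }

float[] rgfBinary = new float[1];
rgfBinary[0] = 1;        // single-output (binary) policy: the action
                         // value itself is the training target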
public List<Datum> GetData()
{
    List<Datum> rgData = new List<Datum>();

    for (int i = 0; i < m_rgItems.Count; i++)
    {
        rgData.Add(new Datum(m_rgItems[i].Data));
    }

    return rgData;
}

public List<Datum> GetClip()
{
    if (m_rgItems.Count == 0)
        return null;

    if (m_rgItems[0].State.Clip == null)
        return null;

    List<Datum> rgData = new List<Datum>();

    for (int i = 0; i < m_rgItems.Count; i++)
    {
        if (m_rgItems[i].State.Clip == null)
            return null;

        rgData.Add(new Datum(m_rgItems[i].State.Clip));
    }

    return rgData;
}
public MemoryItem(StateBase s, SimpleDatum x, int nAction, float[] rgfAprob, float fReward)
m_nAction = nAction;
m_rgfAprob = rgfAprob;
m_fReward = fReward;

public StateBase State
get { return m_state; }

get { return m_nAction; }

get { return m_fReward; }

public float[] Aprob
get { return m_rgfAprob; }
public override string ToString()
{
    return "action = " + m_nAction.ToString() + " reward = " + m_fReward.ToString("N2") + " aprob = " + tostring(m_rgfAprob);
}

private string tostring(float[] rg)
{
    string str = "";

    for (int i = 0; i < rg.Length; i++)
    {
        str += rg[i].ToString("N5") + ",";
    }

    str = str.TrimEnd(',');
    return str;
}