mycaffe/html/pg_8simple_2_trainer_p_g_8cs_source.html

using System;

using System.Collections.Generic;

using System.Drawing;

using System.Linq;

using System.Text;

using System.Threading;

using System.Threading.Tasks;

using MyCaffe.basecode;

using MyCaffe.common;

using MyCaffe.fillers;

using MyCaffe.layers;

using MyCaffe.param;

using MyCaffe.solvers;


namespace MyCaffe.trainers.pg.simple

{

    public class TrainerPG<T> : IxTrainerRL, IDisposable

    {

        IxTrainerCallback m_icallback;

        CryptoRandom m_random = new CryptoRandom();

        MyCaffeControl<T> m_mycaffe;

        PropertySet m_properties;


        public TrainerPG(MyCaffeControl<T> mycaffe, PropertySet properties, CryptoRandom random, IxTrainerCallback icallback)

        {

            m_icallback = icallback;

            m_mycaffe = mycaffe;

            m_properties = properties;

            m_random = random;

        }


        public void Dispose()

        {

        }


        public bool Initialize()

        {

            m_mycaffe.CancelEvent.Reset();

            m_icallback.OnInitialize(new InitializeArgs(m_mycaffe));

            return true;

        }


        private void wait(int nWait)

        {

            int nWaitInc = 250;

            int nTotalWait = 0;


            while (nTotalWait < nWait)

            {

                m_icallback.OnWait(new WaitArgs(nWaitInc));

                nTotalWait += nWaitInc;

            }

        }


        public bool Shutdown(int nWait)

        {

            if (m_mycaffe != null)

            {

                m_mycaffe.CancelEvent.Set();

                wait(nWait);

            }


            m_icallback.OnShutdown();


            return true;

        }


        public ResultCollection RunOne(int nDelay = 1000)

        {

            m_mycaffe.CancelEvent.Reset();

            Agent<T> agent = new Agent<T>(m_icallback, m_mycaffe, m_properties, m_random, Phase.TRAIN);

            agent.Run(Phase.TEST, 1, ITERATOR_TYPE.ITERATION);

            agent.Dispose();

            return null;

        }


        public byte[] Run(int nN, PropertySet runProp, out string type)

        {

            m_mycaffe.CancelEvent.Reset();

            Agent<T> agent = new Agent<T>(m_icallback, m_mycaffe, m_properties, m_random, Phase.RUN);

            byte[] rgResults = agent.Run(nN, out type);

            agent.Dispose();


            return rgResults;

        }


        public bool Test(int nN, ITERATOR_TYPE type)

        {

            int nDelay = 1000;

            string strProp = m_properties.ToString();


            // Turn off the num-skip to run at normal speed.

            strProp += "EnableNumSkip=False;";

            PropertySet properties = new PropertySet(strProp);


            m_mycaffe.CancelEvent.Reset();

            Agent<T> agent = new Agent<T>(m_icallback, m_mycaffe, properties, m_random, Phase.TRAIN);

            agent.Run(Phase.TEST, nN, type);


            agent.Dispose();

            Shutdown(nDelay);


            return true;

        }


        public bool Train(int nN, ITERATOR_TYPE type, TRAIN_STEP step)

        {

            if (step != TRAIN_STEP.NONE)

                throw new Exception("The simple traininer does not support stepping - use the 'PG.MT' trainer instead.");


            m_mycaffe.CancelEvent.Reset();

            Agent<T> agent = new Agent<T>(m_icallback, m_mycaffe, m_properties, m_random, Phase.TRAIN);

            agent.Run(Phase.TRAIN, nN, type);

            agent.Dispose();


            return false;

        }

    }


    class Agent<T> : IDisposable

    {

        IxTrainerCallback m_icallback;

        Brain<T> m_brain;

        PropertySet m_properties;

        CryptoRandom m_random;

        float m_fGamma;

        bool m_bAllowDiscountReset = false;

        bool m_bUseRawInput = false;


        public Agent(IxTrainerCallback icallback, MyCaffeControl<T> mycaffe, PropertySet properties, CryptoRandom random, Phase phase)

        {

            m_icallback = icallback;

            m_brain = new Brain<T>(mycaffe, properties, random, phase);

            m_properties = properties;

            m_random = random;


            m_fGamma = (float)properties.GetPropertyAsDouble("Gamma", 0.99);

            m_bAllowDiscountReset = properties.GetPropertyAsBool("AllowDiscountReset", false);

            m_bUseRawInput = properties.GetPropertyAsBool("UseRawInput", false);

        }


        public void Dispose()

        {

            if (m_brain != null)

            {

                m_brain.Dispose();

                m_brain = null;

            }

        }


        private StateBase getData(Phase phase, int nAction)

        {

            GetDataArgs args = m_brain.getDataArgs(phase, nAction);

            m_icallback.OnGetData(args);

            return args.State;

        }


        private void updateStatus(int nIteration, int nEpisodeCount, double dfRewardSum, double dfRunningReward)

        {

            GetStatusArgs args = new GetStatusArgs(0, nIteration, nEpisodeCount, 1000000, dfRunningReward, dfRewardSum, 0, 0, 0, 0);

            m_icallback.OnUpdateStatus(args);

        }


        public byte[] Run(int nIterations, out string type)

        {

            IxTrainerCallbackRNN icallback = m_icallback as IxTrainerCallbackRNN;

            if (icallback == null)

                throw new Exception("The Run method requires an IxTrainerCallbackRNN interface to convert the results into the native format!");


            StateBase s = getData(Phase.RUN, -1);

            int nIteration = 0;

            List<float> rgResults = new List<float>();


            while (!m_brain.Cancel.WaitOne(0) && (nIterations == -1 || nIteration < nIterations))

            {

                // Preprocess the observation.

                SimpleDatum x = m_brain.Preprocess(s, m_bUseRawInput);


                // Forward the policy network and sample an action.

                float fAprob;

                int action = m_brain.act(x, out fAprob);


                rgResults.Add(s.Data.TimeStamp.ToFileTime());

                rgResults.Add(s.Data.GetDataAtF(0));

                rgResults.Add(action);


                // Take the next step using the action

                StateBase s_ = getData(Phase.RUN, action);

                nIteration++;

            }


            ConvertOutputArgs args = new ConvertOutputArgs(nIterations, rgResults.ToArray());

            icallback.OnConvertOutput(args);


            type = args.RawType;

            return args.RawOutput;

        }


        private bool isAtIteration(int nN, ITERATOR_TYPE type, int nIteration, int nEpisode)

        {

            if (nN == -1)

                return false;


            if (type == ITERATOR_TYPE.EPISODE)

            {

                if (nEpisode < nN)

                    return false;


                return true;

            }

            else

            {

                if (nIteration < nN)

                    return false;


                return true;

            }

        }


        public void Run(Phase phase, int nN, ITERATOR_TYPE type)

        {

            MemoryCollection m_rgMemory = new MemoryCollection();

            double? dfRunningReward = null;

            double dfEpisodeReward = 0;

            int nEpisode = 0;

            int nIteration = 0;


            StateBase s = getData(phase, -1);


            if (s.Clip != null)

                throw new Exception("The PG.SIMPLE trainer does not support recurrent layers or clip data, use the 'PG.ST' or 'PG.MT' trainer instead.");


            while (!m_brain.Cancel.WaitOne(0) && !isAtIteration(nN, type, nIteration, nEpisode))

            {

                // Preprocess the observation.

                SimpleDatum x = m_brain.Preprocess(s, m_bUseRawInput);


                // Forward the policy network and sample an action.

                float fAprob;

                int action = m_brain.act(x, out fAprob);


                // Take the next step using the action

                StateBase s_ = getData(phase, action);

                dfEpisodeReward += s_.Reward;


                if (phase == Phase.TRAIN)

                {

                    // Build up episode memory, using reward for taking the action.

                    m_rgMemory.Add(new MemoryItem(s, x, action, fAprob, (float)s_.Reward));


                    // An episode has finished.

                    if (s_.Done)

                    {

                        nEpisode++;

                        nIteration++;


                        m_brain.Reshape(m_rgMemory);


                        // Compute the discounted reward (backwards through time)

                        float[] rgDiscountedR = m_rgMemory.GetDiscountedRewards(m_fGamma, m_bAllowDiscountReset);

                        // Rewards are standardized when set to be unit normal (helps control the gradient estimator variance)

                        m_brain.SetDiscountedR(rgDiscountedR);


                        // Modulate the gradient with the advantage (PG magic happens right here.)

                        float[] rgDlogp = m_rgMemory.GetPolicyGradients();

                        // discounted R applied to policy gradient within loss function, just before the backward pass.

                        m_brain.SetPolicyGradients(rgDlogp);


                        // Train for one iteration, which triggers the loss function.

                        List<Datum> rgData = m_rgMemory.GetData();

                        m_brain.SetData(rgData);

                        m_brain.Train(nIteration);


                        // Update reward running

                        if (!dfRunningReward.HasValue)

                            dfRunningReward = dfEpisodeReward;

                        else

                            dfRunningReward = dfRunningReward * 0.99 + dfEpisodeReward * 0.01;


                        updateStatus(nIteration, nEpisode, dfEpisodeReward, dfRunningReward.Value);

                        dfEpisodeReward = 0;


                        s = getData(phase, -1);

                        m_rgMemory.Clear();

                    }

                    else

                    {

                        s = s_;

                    }

                }

                else

                {

                    if (s_.Done)

                    {

                        nEpisode++;


                        // Update reward running

                        if (!dfRunningReward.HasValue)

                            dfRunningReward = dfEpisodeReward;

                        else

                            dfRunningReward = dfRunningReward * 0.99 + dfEpisodeReward * 0.01;


                        updateStatus(nIteration, nEpisode, dfEpisodeReward, dfRunningReward.Value);

                        dfEpisodeReward = 0;


                        s = getData(phase, -1);

                    }

                    else

                    {

                        s = s_;

                    }


                    nIteration++;

                }

            }

        }

    }


    class Brain<T> : IDisposable

    {

        MyCaffeControl<T> m_mycaffe;

        Net<T> m_net;

        Solver<T> m_solver;

        MemoryDataLayer<T> m_memData;

        MemoryLossLayer<T> m_memLoss;

        PropertySet m_properties;

        CryptoRandom m_random;

        Blob<T> m_blobDiscountedR;

        Blob<T> m_blobPolicyGradient;

        bool m_bSkipLoss;

        int m_nMiniBatch = 10;

        SimpleDatum m_sdLast = null;


        public Brain(MyCaffeControl<T> mycaffe, PropertySet properties, CryptoRandom random, Phase phase)

        {

            m_mycaffe = mycaffe;

            m_net = mycaffe.GetInternalNet(phase);

            m_solver = mycaffe.GetInternalSolver();

            m_properties = properties;

            m_random = random;


            m_memData = m_net.FindLayer(LayerParameter.LayerType.MEMORYDATA, null) as MemoryDataLayer<T>;

            m_memLoss = m_net.FindLayer(LayerParameter.LayerType.MEMORY_LOSS, null) as MemoryLossLayer<T>;

            SoftmaxLayer<T> softmax = m_net.FindLayer(LayerParameter.LayerType.SOFTMAX, null) as SoftmaxLayer<T>;


            if (softmax != null)

                throw new Exception("The PG.SIMPLE trainer does not support the Softmax layer, use the 'PG.ST' or 'PG.MT' trainer instead.");


            if (m_memData == null)

                throw new Exception("Could not find the MemoryData Layer!");


            if (m_memLoss == null)

                throw new Exception("Could not find the MemoryLoss Layer!");


            m_memLoss.OnGetLoss += memLoss_OnGetLoss;


            m_blobDiscountedR = new Blob<T>(mycaffe.Cuda, mycaffe.Log);

            m_blobPolicyGradient = new Blob<T>(mycaffe.Cuda, mycaffe.Log);


            int nMiniBatch = mycaffe.CurrentProject.GetBatchSize(phase);

            if (nMiniBatch != 0)

                m_nMiniBatch = nMiniBatch;


            m_nMiniBatch = m_properties.GetPropertyAsInt("MiniBatch", m_nMiniBatch);

        }


        private void dispose(ref Blob<T> b)

        {

            if (b != null)

            {

                b.Dispose();

                b = null;

            }

        }


        public void Dispose()

        {

            m_memLoss.OnGetLoss -= memLoss_OnGetLoss;

            dispose(ref m_blobDiscountedR);

            dispose(ref m_blobPolicyGradient);

        }


        public void Reshape(MemoryCollection col)

        {

            int nNum = col.Count;

            int nChannels = col[0].Data.Channels;

            int nHeight = col[0].Data.Height;

            int nWidth = col[0].Data.Height;


            m_blobDiscountedR.Reshape(nNum, 1, 1, 1);

            m_blobPolicyGradient.Reshape(nNum, 1, 1, 1);

        }


        public void SetDiscountedR(float[] rg)

        {

            double dfMean = m_blobDiscountedR.mean(rg);

            double dfStd = m_blobDiscountedR.std(dfMean, rg);

            m_blobDiscountedR.SetData(Utility.ConvertVec<T>(rg));

            m_blobDiscountedR.NormalizeData(dfMean, dfStd);

        }


        public void SetPolicyGradients(float[] rg)

        {

            m_blobPolicyGradient.SetData(Utility.ConvertVec<T>(rg));

        }


        public void SetData(List<Datum> rgData)

        {

            m_memData.AddDatumVector(rgData, null, 1, true, true);

        }


        public GetDataArgs getDataArgs(Phase phase, int nAction)

        {

            bool bReset = (nAction == -1) ? true : false;

            return new GetDataArgs(phase, 0, m_mycaffe, m_mycaffe.Log, m_mycaffe.CancelEvent, bReset, nAction, false);

        }


        public Log Log

        {

            get { return m_mycaffe.Log; }

        }


        public CancelEvent Cancel

        {

            get { return m_mycaffe.CancelEvent; }

        }


        public SimpleDatum Preprocess(StateBase s, bool bUseRawInput)

        {

            SimpleDatum sd = new SimpleDatum(s.Data, true);


            if (bUseRawInput)

                return sd;


            if (m_sdLast == null)

                sd.Zero();

            else

                sd.Sub(m_sdLast);


            m_sdLast = s.Data;


            return sd;

        }


        public int act(SimpleDatum sd, out float fAprob)

        {

            List<Datum> rgData = new List<Datum>();

            rgData.Add(new Datum(sd));

            double dfLoss;


            m_memData.AddDatumVector(rgData, null, 1, true, true);

            m_bSkipLoss = true;

            BlobCollection<T> res = m_net.Forward(out dfLoss);

            m_bSkipLoss = false;

            float[] rgfAprob = null;


            for (int i = 0; i < res.Count; i++)

            {

                if (res[i].type != BLOB_TYPE.LOSS)

                {

                    rgfAprob = Utility.ConvertVecF<T>(res[i].update_cpu_data());

                    break;

                }

            }


            if (rgfAprob == null)

                throw new Exception("Could not find a non-loss output!  Your model should output the loss and the action probabilities.");


            if (rgfAprob.Length != 1)

                throw new Exception("The simple policy gradient only supports a single data output!");


            fAprob = rgfAprob[0];


            // Roll the dice!

            if (m_random.NextDouble() < (double)fAprob)

                return 0;

            else

                return 1;

        }


        public void Train(int nIteration)

        {

            m_mycaffe.Log.Enable = false;

            m_solver.Step(1, TRAIN_STEP.NONE, false, false, true, true);  // accumulate grad over batch


            if (nIteration % m_nMiniBatch == 0)

            {

                m_solver.ApplyUpdate(nIteration);

                m_net.ClearParamDiffs();

            }


            m_mycaffe.Log.Enable = true;

        }


        private void memLoss_OnGetLoss(object sender, MemoryLossLayerGetLossArgs<T> e)

        {

            if (m_bSkipLoss)

                return;


            int nCount = m_blobPolicyGradient.count();

            long hPolicyGrad = m_blobPolicyGradient.mutable_gpu_data;

            long hBottomDiff = e.Bottom[0].mutable_gpu_diff;

            long hDiscountedR = m_blobDiscountedR.gpu_data;


            // Calculate the actual loss.

            double dfSumSq = Utility.ConvertVal<T>(m_blobPolicyGradient.sumsq_data());

            double dfMean = dfSumSq;


            e.Loss = dfMean;

            e.EnableLossUpdate = false; // apply gradients to bottom directly.


            // Modulate the gradient with the advantage (PG magic happens right here.)

            m_mycaffe.Cuda.mul(nCount, hPolicyGrad, hDiscountedR, hPolicyGrad);

            m_mycaffe.Cuda.copy(nCount, hPolicyGrad, hBottomDiff);

            m_mycaffe.Cuda.mul_scalar(nCount, -1.0, hBottomDiff);

        }

    }


    class MemoryCollection : GenericList<MemoryItem>

    {

        public MemoryCollection()

        {

        }


        public float[] GetDiscountedRewards(float fGamma, bool bAllowReset)

        {

            float fRunningAdd = 0;

            float[] rgR = m_rgItems.Select(p => p.Reward).ToArray();

            float[] rgDiscountedR = new float[rgR.Length];


            for (int t = Count - 1; t >= 0; t--)

            {

                if (bAllowReset && rgR[t] != 0)

                    fRunningAdd = 0;


                fRunningAdd = fRunningAdd * fGamma + rgR[t];

                rgDiscountedR[t] = fRunningAdd;

            }


            return rgDiscountedR;

        }


        public float[] GetPolicyGradients()

        {

            return m_rgItems.Select(p => p.dlogps).ToArray();

        }


        public List<Datum> GetData()

        {

            List<Datum> rgData = new List<Datum>();


            for (int i = 0; i < m_rgItems.Count; i++)

            {

                rgData.Add(new Datum(m_rgItems[i].Data));

            }


            return rgData;

        }


        public List<Datum> GetClip()

        {

            return null;

        }

    }


    class MemoryItem

    {

        StateBase m_state;

        SimpleDatum m_x;

        int m_nAction;

        float m_fAprob;

        float m_fReward;


        public MemoryItem(StateBase s, SimpleDatum x, int nAction, float fAprob, float fReward)

        {

            m_state = s;

            m_x = x;

            m_nAction = nAction;

            m_fAprob = fAprob;

            m_fReward = fReward;

        }


        public StateBase State

        {

            get { return m_state; }

        }


        public SimpleDatum Data

        {

            get { return m_x; }

        }


        public int Action

        {

            get { return m_nAction; }

        }


        public float Reward

        {

            get { return m_fReward; }

        }


        public float dlogps

        {

            get

            {

                float fY = 0;


                if (m_nAction == 0)

                    fY = 1;


                return fY - m_fAprob;

            }

        }


        public override string ToString()

        {

            return "action = " + m_nAction.ToString() + " reward = " + m_fReward.ToString("N2") + " aprob = " + m_fAprob.ToString("N5") + " dlogps = " + dlogps.ToString("N5");

        }

    }

}

MyCaffe.MyCaffeControl
The MyCaffeControl is the main object used to manage all training, testing and running of the MyCaffe...
Definition: MyCaffeControl.cs:35

MyCaffe.MyCaffeControl.CancelEvent
CancelEvent CancelEvent
Returns the CancelEvent used.
Definition: MyCaffeControl.cs:648

MyCaffe.basecode.CancelEvent
The CancelEvent provides an extension to the manual cancel event that allows for overriding the manua...
Definition: CancelEvent.cs:17

MyCaffe.basecode.CancelEvent.Reset
void Reset()
Resets the event clearing any signaled state.
Definition: CancelEvent.cs:279

MyCaffe.basecode.CancelEvent.CancelEvent
CancelEvent()
The CancelEvent constructor.
Definition: CancelEvent.cs:28

MyCaffe.basecode.CancelEvent.Set
void Set()
Sets the event to the signaled state.
Definition: CancelEvent.cs:270

MyCaffe.basecode.CryptoRandom
The CryptoRandom is a random number generator that can use either the standard .Net Random objec or t...
Definition: CryptoRandom.cs:14

MyCaffe.basecode.CryptoRandom.NextDouble
double NextDouble()
Returns a random double within the range .
Definition: CryptoRandom.cs:83

MyCaffe.basecode.Datum
The Datum class is a simple wrapper to the SimpleDatum class to ensure compatibility with the origina...
Definition: Datum.cs:12

MyCaffe.basecode.GenericList
The GenericList provides a base used to implement a generic list by only implementing the minimum amo...
Definition: GenericList.cs:15

MyCaffe.basecode.GenericList< MemoryItem >::m_rgItems
List< T > m_rgItems
The actual list of items.
Definition: GenericList.cs:19

MyCaffe.basecode.Log
The Log class provides general output in text form.
Definition: Log.cs:13

MyCaffe.basecode.Log.Log
Log(string strSrc)
The Log constructor.
Definition: Log.cs:33

MyCaffe.basecode.PropertySet
Specifies a key-value pair of properties.
Definition: PropertySet.cs:16

MyCaffe.basecode.PropertySet.GetPropertyAsInt
int GetPropertyAsInt(string strName, int nDefault=0)
Returns a property as an integer value.
Definition: PropertySet.cs:287

MyCaffe.basecode.PropertySet.GetPropertyAsBool
bool GetPropertyAsBool(string strName, bool bDefault=false)
Returns a property as a boolean value.
Definition: PropertySet.cs:267

MyCaffe.basecode.PropertySet.GetPropertyAsDouble
double GetPropertyAsDouble(string strName, double dfDefault=0)
Returns a property as an double value.
Definition: PropertySet.cs:307

MyCaffe.basecode.PropertySet.ToString
override string ToString()
Returns the string representation of the properties.
Definition: PropertySet.cs:325

MyCaffe.basecode.SimpleDatum
The SimpleDatum class holds a data input within host memory.
Definition: SimpleDatum.cs:161

MyCaffe.basecode.SimpleDatum.Sub
bool Sub(SimpleDatum sd, bool bSetNegativeToZero=false)
Subtract the data of another SimpleDatum from this one, so this = this - sd.
Definition: SimpleDatum.cs:1064

MyCaffe.basecode.SimpleDatum.Zero
void Zero()
Zero out all data in the datum but keep the size and other settings.
Definition: SimpleDatum.cs:1046

MyCaffe.basecode.SimpleDatum.Add
SimpleDatum Add(SimpleDatum d)
Creates a new SimpleDatum and adds another SimpleDatum to it.
Definition: SimpleDatum.cs:2046

MyCaffe.basecode.SimpleDatum.ToString
override string ToString()
Return a string representation of the SimpleDatum.
Definition: SimpleDatum.cs:2444

MyCaffe.basecode.Utility
The Utility class provides general utility funtions.
Definition: Utility.cs:35

MyCaffe.basecode.Utility.ConvertVec
static double[] ConvertVec(float[] rgf)
Convert an array of float to an array of generics.
Definition: Utility.cs:550

MyCaffe.common.BlobCollection
The BlobCollection contains a list of Blobs.
Definition: BlobCollection.cs:16

MyCaffe.common.BlobCollection.Count
int Count
Returns the number of items in the collection.
Definition: BlobCollection.cs:30

MyCaffe.common.Blob
The Blob is the main holder of data that moves through the Layers of the Net.
Definition: Blob.cs:25

MyCaffe.common.Blob.SetData
void SetData(T[] rgData, int nCount=-1, bool bSetCount=true)
Sets a number of items within the Blob's data.
Definition: Blob.cs:1922

MyCaffe.common.Blob.mutable_gpu_data
long mutable_gpu_data
Returns the data GPU handle used by the CudaDnn connection.
Definition: Blob.cs:1487

MyCaffe.common.Blob.Reshape
void Reshape(int nNum, int nChannels, int nHeight, int nWidth, bool? bUseHalfSize=null)
DEPRECIATED; use
Definition: Blob.cs:442

MyCaffe.common.Blob.std
double std(double? dfMean=null, float[] rgDf=null)
Calculate the standard deviation of the blob data.
Definition: Blob.cs:3007

MyCaffe.common.Blob.mean
double mean(float[] rgDf=null, bool bDiff=false)
Calculate the mean of the blob data.
Definition: Blob.cs:2965

MyCaffe.common.Blob.sumsq_data
T sumsq_data()
Calcualte the sum of squares (L2 norm squared) of the data.
Definition: Blob.cs:1730

MyCaffe.common.Blob.NormalizeData
void NormalizeData(double? dfMean=null, double? dfStd=null)
Normalize the blob data by subtracting the mean and dividing by the standard deviation.
Definition: Blob.cs:2942

MyCaffe.common.Blob.count
int count()
Returns the total number of items in the Blob.
Definition: Blob.cs:739

MyCaffe.common.Blob.gpu_data
long gpu_data
Returns the data GPU handle used by the CudaDnn connection.
Definition: Blob.cs:1479

MyCaffe.common.Net
Connects Layer's together into a direct acrylic graph (DAG) specified by a NetParameter
Definition: Net.cs:23

MyCaffe.common.Net.Forward
BlobCollection< T > Forward()
Run forward with the input Blob's already fed separately.
Definition: Net.cs:1445

MyCaffe.common.Net.FindLayer
Layer< T > FindLayer(LayerParameter.LayerType? type, string strName)
Find the layer with the matching type, name and or both.
Definition: Net.cs:2748

MyCaffe.common.Net.ClearParamDiffs
void ClearParamDiffs()
Zero out the diffs of all netw parameters. This should be run before Backward.
Definition: Net.cs:1907

MyCaffe.common.ResultCollection
The ResultCollection contains the result of a given CaffeControl::Run.
Definition: ResultCollection.cs:17

MyCaffe.layers.MemoryDataLayer
The MemoryDataLayer provides data to the Net from memory. This layer is initialized with the MyCaffe....
Definition: MemoryDataLayer.cs:21

MyCaffe.layers.MemoryDataLayer.AddDatumVector
virtual void AddDatumVector(Datum[] rgData, Datum[] rgClip=null, int nLblAxis=1, bool bReset=false, bool bResizeBatch=false)
This method is used to add a list of Datums to the memory.
Definition: MemoryDataLayer.cs:276

MyCaffe.layers.MemoryLossLayerGetLossArgs
The MemoryLossLayerGetLossArgs class is passed to the OnGetLoss event.
Definition: MemoryLossLayer.cs:242

MyCaffe.layers.MemoryLossLayerGetLossArgs.EnableLossUpdate
bool EnableLossUpdate
Get/set enabling the loss update within the backpropagation pass.
Definition: MemoryLossLayer.cs:300

MyCaffe.layers.MemoryLossLayerGetLossArgs.Loss
double Loss
Get/set the externally calculated total loss.
Definition: MemoryLossLayer.cs:291

MyCaffe.layers.MemoryLossLayerGetLossArgs.Bottom
BlobCollection< T > Bottom
Specifies the bottom passed in during the forward pass.
Definition: MemoryLossLayer.cs:275

MyCaffe.layers.MemoryLossLayer
The MemoryLossLayer provides a method of performing a custom loss functionality. Similar to the Memor...
Definition: MemoryLossLayer.cs:21

MyCaffe.layers.MemoryLossLayer.OnGetLoss
EventHandler< MemoryLossLayerGetLossArgs< T > > OnGetLoss
The OnGetLoss event fires during each forward pass. The value returned is saved, and applied on the b...
Definition: MemoryLossLayer.cs:30

MyCaffe.layers.SoftmaxLayer
The SoftmaxLayer computes the softmax function. This layer is initialized with the MyCaffe....
Definition: SoftmaxLayer.cs:24

MyCaffe.param.LayerParameter
Specifies the base parameter for all layers.
Definition: LayerParameter.cs:24

MyCaffe.param.LayerParameter.LayerType
LayerType
Specifies the layer type.
Definition: LayerParameter.cs:110

MyCaffe.solvers.Solver
An interface for classes that perform optimization on Nets - this class serves as the base class for ...
Definition: Solver.cs:28

MyCaffe.solvers.Solver.Step
bool Step(int nIters, TRAIN_STEP step=TRAIN_STEP.NONE, bool bZeroDiffs=true, bool bApplyUpdates=true, bool bDisableOutput=false, bool bDisableProgress=false, double? dfLossOverride=null, bool? bAllowSnapshot=null)
Steps a set of iterations through a training cycle.
Definition: Solver.cs:818

MyCaffe.solvers.Solver.ApplyUpdate
abstract double ApplyUpdate(int nIterationOverride=-1)
Make and apply the update value for the current iteration.

MyCaffe.trainers.InitializeArgs
The InitializeArgs is passed to the OnInitialize event.
Definition: EventArgs.cs:90

MyCaffe.trainers.WaitArgs
The WaitArgs is passed to the OnWait event.
Definition: EventArgs.cs:65

MyCaffe.trainers.pg.simple.TrainerPG
The TrainerPG implements a simple Policy Gradient trainer inspired by Andrej Karpathy's blog posed re...
Definition: TrainerPG.cs:26

MyCaffe.trainers.pg.simple.TrainerPG.Run
byte[] Run(int nN, PropertySet runProp, out string type)
Run a set of iterations and return the resuts.
Definition: TrainerPG.cs:116

MyCaffe.trainers.pg.simple.TrainerPG.Initialize
bool Initialize()
Initialize the trainer.
Definition: TrainerPG.cs:58

MyCaffe.trainers.pg.simple.TrainerPG.Test
bool Test(int nN, ITERATOR_TYPE type)
Run the test cycle - currently this is not implemented.
Definition: TrainerPG.cs:132

MyCaffe.trainers.pg.simple.TrainerPG.Train
bool Train(int nN, ITERATOR_TYPE type, TRAIN_STEP step)
Train the network using a modified PG training algorithm optimized for GPU use.
Definition: TrainerPG.cs:158

MyCaffe.trainers.pg.simple.TrainerPG.TrainerPG
TrainerPG(MyCaffeControl< T > mycaffe, PropertySet properties, CryptoRandom random, IxTrainerCallback icallback)
The constructor.
Definition: TrainerPG.cs:39

MyCaffe.trainers.pg.simple.TrainerPG.Shutdown
bool Shutdown(int nWait)
Shutdown the trainer.
Definition: TrainerPG.cs:82

MyCaffe.trainers.pg.simple.TrainerPG.Dispose
void Dispose()
Releases all resources used.
Definition: TrainerPG.cs:50

MyCaffe.trainers.pg.simple.TrainerPG.RunOne
ResultCollection RunOne(int nDelay=1000)
Run a single cycle on the environment after the delay.
Definition: TrainerPG.cs:100

MyCaffe.trainers.IxTrainerCallback
The IxTrainerCallback provides functions used by each trainer to 'call-back' to the parent for inform...
Definition: Interfaces.cs:303

MyCaffe.trainers.IxTrainerRL
The IxTrainerRL interface is implemented by each RL Trainer.
Definition: Interfaces.cs:257

MyCaffe.basecode
The MyCaffe.basecode contains all generic types used throughout MyCaffe.
Definition: Annotation.cs:12

MyCaffe.basecode.Phase
Phase
Defines the Phase under which to run a Net.
Definition: Interfaces.cs:61

MyCaffe.common
The MyCaffe.common namespace contains common MyCaffe classes.
Definition: BatchInput.cs:8

MyCaffe.common.BLOB_TYPE
BLOB_TYPE
Defines the tpe of data held by a given Blob.
Definition: Interfaces.cs:62

MyCaffe.common.TRAIN_STEP
TRAIN_STEP
Defines the training stepping method (if any).
Definition: Interfaces.cs:131

MyCaffe.fillers
The MyCaffe.fillers namespace contains all fillers including the Filler class.
Definition: BilinearFiller.cs:10

MyCaffe.layers
The MyCaffe.layers namespace contains all layers that have a solidified code base,...
Definition: LayerFactory.cs:15

MyCaffe.param
The MyCaffe.param namespace contains parameters used to create models.
Definition: AttentionParameter.cs:9

MyCaffe.solvers
The MyCaffe.solvers namespace contains all solver classes, including the base Solver.
Definition: AdaDeltaSolver.cs:13

MyCaffe.trainers.pg.simple
Definition: TrainerPG.cs:16

MyCaffe.trainers.ITERATOR_TYPE
ITERATOR_TYPE
Specifies the iterator type to use.
Definition: Interfaces.cs:22

MyCaffe
The MyCaffe namespace contains the main body of MyCaffe code that closesly tracks the C++ Caffe open-...
Definition: Annotation.cs:12

System
Definition: Component.cs:11