2using System.Collections.Generic;
27 public abstract class Solver<T> : IDisposable
61 AutoResetEvent m_evtCompleted =
new AutoResetEvent(
false);
62 bool m_bEnableTest =
true;
63 bool m_bEnableBlobDebugging =
false;
64 bool m_bEnableBreakOnNan =
false;
65 bool m_bEnableDetailedNanDetection =
false;
66 bool m_bEnableSingleStep =
false;
77 AutoResetEvent m_evtForceSnapshot;
78 AutoResetEvent m_evtForceTest;
95 double m_dfLastAccuracy = 0;
96 double m_dfLastError =
double.MaxValue;
97 double m_dfBestAccuracy = 0;
98 double m_dfBestError =
double.MaxValue;
100 int m_nTrainingIterationOverride = -1;
101 int m_nTestingIterationOverride = -1;
103 bool m_bWeightsUpdated =
false;
104 static object m_syncGetRi =
new object();
105 Blob<T> m_blobBatchInputData =
null;
106 double m_dfAverageTestTime = 0;
108 int m_nTrainingTimeLimitInMinutes = 0;
109 long m_hWorkspaceData = 0;
110 ulong m_lWorkspaceSizeInBytes = 0;
111 bool m_bFirstNanError =
true;
112 List<double> m_rgAverageAccuracyWindow =
null;
113 bool m_bForceTest =
false;
146 public event EventHandler<TestArgs>
OnTest;
181 public Solver(
CudaDnn<T> cuda,
Log log,
SolverParameter p,
CancelEvent evtCancel, AutoResetEvent evtForceSnapshot, AutoResetEvent evtForceTest,
IXDatabaseBase db,
IXPersist<T> persist,
int nSolverCount = 1,
int nSolverRank = 0,
Net<T> shareNet =
null, onGetWorkspace getws =
null, onSetWorkspace setws =
null)
185 m_evtCancel = evtCancel;
186 m_evtForceSnapshot = evtForceSnapshot;
187 m_evtForceTest = evtForceTest;
205 m_rgAverageAccuracyWindow =
new List<double>();
208 m_rgAverageAccuracyWindow.Add(0);
238 int nTimingCount = 0;
239 double dfTotalTime = 0;
240 return fireOnTrainingIterationEvent(
false, 0, 0, ref nTimingCount, ref dfTotalTime);
243 private bool fireOnTrainingIterationEvent(
bool bFwdPassNanFree,
double dfLoss,
double dfLastLearningRate, ref
int nTimingCount, ref
double dfTotalTime)
247 string strFirstNanBlob =
null;
250 if (m_bEnableBlobDebugging)
252 dbgInfo =
TrainingNet.GetDebugInformation(m_bEnableDetailedNanDetection);
254 if (m_bEnableBreakOnNan && dbgInfo !=
null)
259 if (strFirstNanBlob !=
null)
261 string strPass = (!bFwdPassNanFree) ?
"Forward" :
"Backward";
262 m_log.
WriteLine(
"First NaN detected in the '" + strType +
"' of blob '" + strFirstNanBlob +
"' after " + strPass +
" pass.");
265 string strLastNanBlob = dbgInfo.
DetectLastNaN(out strTypeLast);
267 if (strLastNanBlob != strFirstNanBlob && strType != strTypeLast)
268 m_log.
WriteLine(
"Last NaN detected in the '" + strTypeLast +
"' of blob '" + strLastNanBlob +
"' after " + strPass +
" pass.");
273 double dfTime = (nTimingCount > 0) ? (dfTotalTime / nTimingCount) : 0;
274 OnTrainingIteration(
this,
new TrainingIterationArgs<T>(
m_nIter, m_dfLastAccuracy, dfLoss,
m_dfSmoothedLoss, m_dfBestError, m_bWeightsUpdated,
m_net.ActiveLabelCounts,
m_net.LabelQueryHitPercents,
m_net.LabelQueryEpochs,
m_net.BoostQueryHitPercents, dfLastLearningRate, dfTime, dbgInfo));
278 if (strFirstNanBlob !=
null)
280 m_log.
WriteLine(
"Training is now stopping at iteration " +
m_nIter.ToString(
"N0") +
" as the first NaN has been detected ('" + strFirstNanBlob +
"').");
293 get {
return m_nTrainingTimeLimitInMinutes; }
294 set { m_nTrainingTimeLimitInMinutes = value; }
302 get {
return m_snapshotWeightUpdatemMethod; }
303 set { m_snapshotWeightUpdatemMethod = value; }
332 if (m_blobBatchInputData !=
null)
334 m_blobBatchInputData.
Dispose();
335 m_blobBatchInputData =
null;
338 if (m_hWorkspaceData != 0)
340 m_cuda.DisableGhostMemory();
341 m_cuda.FreeMemory(m_hWorkspaceData);
342 m_cuda.ResetGhostMemory();
343 m_hWorkspaceData = 0;
344 m_lWorkspaceSizeInBytes = 0;
353 get {
return m_bEnableTest; }
354 set { m_bEnableTest = value; }
362 get {
return m_bEnableBlobDebugging; }
363 set { m_bEnableBlobDebugging = value; }
383 get {
return m_bEnableBreakOnNan; }
384 set { m_bEnableBreakOnNan = value; }
396 get {
return m_bEnableDetailedNanDetection; }
397 set { m_bEnableDetailedNanDetection = value; }
405 get {
return m_bEnableSingleStep; }
406 set { m_bEnableSingleStep = value; }
414 get {
return m_bWeightsUpdated; }
415 set { m_bWeightsUpdated = value; }
423 get {
return m_tag; }
424 set { m_tag = value; }
446 get {
return m_net; }
493 string field_names =
"net_param, train_net_param";
494 m_log.
CHECK_GE(num_train_nets, 1,
"SolverParameter must specify a train net using one of these fields: " + field_names);
495 m_log.
CHECK_LE(num_train_nets, 1,
"SolverParameter must not contain more than one of these fields specifying a train_net: " + field_names);
500 m_log.
WriteLine(
"Creating training net specified in train_net_param.");
518 net_param.
state = net_state;
521 m_net =
new Net<T>(
m_cuda,
m_log, net_param, m_evtCancel, m_db,
Phase.NONE, m_evtCompleted, shareNet, net_OnGetWorkspace, net_OnSetWorkspace);
522 m_net.OnGetIteration += net_OnGetIteration;
524 m_blobAccuracy =
m_net.FindBlob(
"accuracy");
526 catch(Exception excpt)
528 throw new Exception(
"Initializing Training Net: " + excpt.Message);
532 private void net_OnSetWorkspace(
object sender,
WorkspaceArgs e)
543 m_cuda.DisableGhostMemory();
549 if (m_hWorkspaceData != 0)
550 m_cuda.FreeMemory(m_hWorkspaceData);
553 m_hWorkspaceData =
m_cuda.AllocMemory((
long)lCount);
556 m_cuda.ResetGhostMemory();
559 private void net_OnGetWorkspace(
object sender,
WorkspaceArgs e)
585 int num_test_nets = num_test_net_params;
587 if (num_generic_nets > 0)
598 int num_test_net_instances = num_test_nets + num_generic_net_instances;
603 if (num_test_net_instances > 0)
606 List<string> sources =
new List<string>();
607 List<NetParameter> net_params =
new List<NetParameter>();
609 for (
int i = 0; i < num_test_net_params; i++)
611 sources.Add(
"test_net_param");
619 for (
int i = 0; i < remaining_test_nets; i++)
621 sources.Add(
"net_param");
628 for (
int i = 0; i < num_test_net_instances; i++)
636 net_state.
MergeFrom(net_params[i].state);
641 net_params[i].state = net_state;
643 m_log.
WriteLine(
"Creating test net (#" + i.ToString() +
") specified by " + sources[i],
true);
650 catch (Exception excpt)
652 throw new Exception(
"Initializing Testing Nets: " + excpt.Message);
669 get {
return m_net.ActiveLabelCounts; }
677 get {
return m_net.LabelQueryHitPercents; }
685 get {
return m_net.LabelQueryEpochs; }
713 if (m_nTrainingIterationOverride > 0)
714 nIters = m_nTrainingIterationOverride;
729 if (m_nTestingIterationOverride > 0)
730 nIters = m_nTestingIterationOverride;
744 public virtual void Solve(
int nIterationOverride = -1,
byte[] rgWeights =
null,
byte[] rgState =
null,
TRAIN_STEP step =
TRAIN_STEP.NONE)
750 if (rgWeights !=
null || rgState !=
null)
757 if (nIterationOverride <= 0)
760 if (!
Step(nIterationOverride, step))
767 else if (
m_net.learnable_parameters.SnapshotRequested(
true))
785 m_net.Forward(out dfLoss);
799 if (m_blobBatchInputData !=
null)
801 m_blobBatchInputData.
Dispose();
802 m_blobBatchInputData =
null;
818 public bool Step(
int nIters,
TRAIN_STEP step =
TRAIN_STEP.NONE,
bool bZeroDiffs =
true,
bool bApplyUpdates =
true,
bool bDisableOutput =
false,
bool bDisableProgress =
false,
double? dfLossOverride =
null,
bool? bAllowSnapshot =
null)
820 Exception err =
null;
826 int stop_iter =
m_nIter + nIters;
836 m_net.EnableBreakOnFirstNaN = m_bEnableBreakOnNan && m_bEnableBlobDebugging;
837 m_net.EnableDetailedNanDetection = m_bEnableDetailedNanDetection & m_bEnableBlobDebugging;
839 Stopwatch sw =
new Stopwatch();
842 Stopwatch swTimeout =
new Stopwatch();
845 while (
m_nIter < stop_iter && !m_evtCompleted.WaitOne(0))
849 m_net.ClearParamDiffs();
852 OnStart(
this,
new EventArgs());
873 double dfLossTotal = 0;
874 double? dfAccuracyTotal =
null;
877 Stopwatch swTiming =
new Stopwatch();
878 double dfTotalTime = 0;
879 int nTimingCount = 0;
880 bool bFwdPassNanFree =
true;
885 double? dfLocalAccuracy =
null;
898 bFwdPassNanFree =
m_net.ForwardBackward(colBottom, out dfLocalLoss, step);
900 if (m_blobAccuracy !=
null)
901 dfLocalAccuracy =
Utility.ConvertVal<T>(m_blobAccuracy.
GetData(0));
904 if (
double.IsNaN(dfLocalLoss) ||
double.IsInfinity(dfLocalLoss))
906 if (m_bFirstNanError)
908 m_log.
WriteError(
new Exception(
"The local loss at iteration " +
m_nIter.ToString() +
" is invalid (NAN or INFINITY)!"));
909 m_bFirstNanError =
false;
913 if (dfLocalAccuracy.HasValue)
915 if (!dfAccuracyTotal.HasValue)
918 dfAccuracyTotal = dfAccuracyTotal + dfLocalAccuracy.Value;
921 dfLossTotal += dfLocalLoss;
924 dfTotalTime += swTiming.Elapsed.TotalMilliseconds;
928 if (!bFwdPassNanFree)
932 dfLoss = dfLossTotal / nIterCount;
933 dfLoss = dfLossOverride.GetValueOrDefault(dfLoss);
935 if (dfAccuracyTotal.HasValue)
941 bool bDisplay =
false;
942 if (!bDisplay1 && sw.ElapsedMilliseconds > 2000 && !bDisableOutput)
945 m_bFirstNanError =
true;
949 if (bDisplay && bDisplay1)
958 for (
int j = 0; j < colResult.
Count; j++)
961 int nIdx =
m_net.output_blob_indices[j];
962 string output_name =
m_net.blob_names[nIdx];
963 double loss_weight =
m_net.blob_loss_weights[nIdx];
964 double dfTotalLossWeight = 0;
965 int nResultCount = colResult[j].count();
967 for (
int k = 0; k < nResultCount; k++)
973 if (loss_weight != 0)
974 strOut +=
" (* " + loss_weight.ToString() +
" = " + (loss_weight * result_vec[k]).ToString() +
" loss)";
976 m_log.
WriteLine(
" Train net output #" + score_index.ToString() +
": " + output_name +
" = " + result_vec[k].ToString() + strOut);
981 dfTotalLossWeight += loss_weight * result_vec[k];
987 double dfAverage = dfTotalLossWeight / nResultCount;
988 m_log.
WriteLine(
" Average weighted score = " + dfAverage.ToString() +
" for '" + output_name +
"' - averaged over " + nResultCount.ToString(
"N0") +
" results.");
997 double dfLastLearningRate = 0;
999 if (step !=
TRAIN_STEP.FORWARD && bApplyUpdates)
1005 if (!bDisableProgress)
1008 bool bSnapshotTaken =
false;
1014 (m_dfLastAccuracy > m_dfBestAccuracy))))
1016 bSnapshotTaken =
true;
1019 if (m_dfLastAccuracy > m_dfBestAccuracy)
1020 m_dfBestAccuracy = m_dfLastAccuracy;
1027 fireOnTrainingIterationEvent(bFwdPassNanFree, dfLoss, dfLastLearningRate, ref nTimingCount, ref dfTotalTime);
1032 if (step !=
TRAIN_STEP.NONE || m_bEnableSingleStep)
1036 if (!bDisableOutput)
1037 m_log.
WriteLine(
"Single step (both) triggered - solving stopped after a single forward/backward pass.");
1041 if (!bDisableOutput)
1042 m_log.
WriteLine(
"Single step (forward) triggered - solving stopped after a single forward pass.");
1046 if (!bDisableOutput)
1047 m_log.
WriteLine(
"Single step (backward) triggered - solving stopped after a single backward pass.");
1053 if (!bSnapshotTaken)
1064 if (m_nTrainingTimeLimitInMinutes > 0 && swTimeout.Elapsed.TotalMinutes > m_nTrainingTimeLimitInMinutes)
1066 m_log.
WriteLine(
"A training time-limit of " + m_nTrainingTimeLimitInMinutes.ToString(
"N0") +
" minutes has been exceeded - training will now stop.");
1076 catch (Exception excpt)
1083 if (err !=
null || m_evtCancel.
WaitOne(0))
1097 public void Restore(
byte[] rgWeights,
byte[] rgState,
string strSkipBlobTypes =
null)
1099 m_net.LoadWeights(rgWeights,
m_persist,
null,
null, strSkipBlobTypes);
1101 if (rgState !=
null)
1103 m_log.
WriteLine(
"Restoring previous solver state from restore state...");
1115 public void Snapshot(
bool bForced,
bool bScheduled,
bool bUpdateDatabase =
true)
1138 private void args_OnGetWeights(
object sender,
GetBytesArgs e)
1144 private void args_OnGetState(
object sender,
GetBytesArgs e)
1161 if (dfAccuracy == 0)
1162 dfAccuracy = 0.0001;
1180 get {
return m_nTrainingIterationOverride; }
1181 set { m_nTrainingIterationOverride = value; }
1189 get {
return m_nTestingIterationOverride; }
1190 set { m_nTestingIterationOverride = value; }
1198 get {
return m_evtCompleted; }
1206 get {
return m_evtCancel; }
1230 get {
return m_net; }
1264 if (m_evtForceSnapshot ==
null)
1267 return m_evtForceSnapshot.WaitOne(0);
1278 if (m_evtForceTest ==
null)
1281 m_bForceTest = m_evtForceTest.WaitOne(0);
1282 return m_bForceTest;
1322 public double TestAll(
int nIterationOverride = -1)
1324 double dfTotalAccuracy = 0;
1325 double dfTotalTime = 0;
1326 int nTotalCount = 0;
1328 for (
int test_net_id = 0; test_net_id <
m_rgTestNets.Count; test_net_id++)
1340 dfTotalAccuracy += testOne(nIterationOverride, test_net_id);
1342 dfTotalTime += m_dfAverageTestTime;
1355 dfTotalAccuracy += testOne(nIterationOverride, 0);
1360 if (m_rgAverageAccuracyWindow !=
null)
1362 m_rgAverageAccuracyWindow.Add(dfAccuracy);
1363 m_rgAverageAccuracyWindow.RemoveAt(0);
1364 dfAccuracy = m_rgAverageAccuracyWindow.Average();
1369 double dfTime = (nTotalCount > 0) ? dfTotalTime / nTotalCount : 0;
1376 private double testOne(
int nIterationOverride = -1,
int nTestNetId = 0)
1398 Stopwatch sw =
new Stopwatch();
1404 m_log.
WriteLine(
"Iteration " +
m_nIter.ToString() +
", Testing net (#" + nTestNetId.ToString() +
")");
1415 Dictionary<int, Dictionary<int, List<Tuple<float, int>>>> rgAllTruePos =
new Dictionary<int, Dictionary<int, List<Tuple<float, int>>>>();
1416 Dictionary<int, Dictionary<int, List<Tuple<float, int>>>> rgAllFalsePos =
new Dictionary<int, Dictionary<int, List<Tuple<float, int>>>>();
1417 Dictionary<int, Dictionary<int, int>> rgAllNumPos =
new Dictionary<int, Dictionary<int, int>>();
1421 if (nIterationOverride <= 0)
1424 int nIter = nIterationOverride;
1427 for (
int i = 0; i < nIter; i++)
1440 dfLoss += iter_loss;
1442 for (
int j = 0; j < colResult.
Count; j++)
1444 m_log.
CHECK_EQ(colResult[j].width, 5,
"The width must be = 5 for SSD.");
1446 int num_det = colResult[j].height;
1448 for (
int k = 0; k < num_det; k++)
1450 int item_id = (int)result_vec[k * 5];
1451 int nLabel = (int)result_vec[k * 5 + 1];
1456 if (!rgAllNumPos.ContainsKey(j))
1457 rgAllNumPos.
Add(j,
new Dictionary<int, int>());
1459 if (!rgAllNumPos[j].ContainsKey(nLabel))
1460 rgAllNumPos[j].Add(nLabel, (
int)result_vec[k * 5 + 2]);
1462 rgAllNumPos[j][nLabel] += (int)result_vec[k * 5 + 2];
1467 float fScore = (float)result_vec[k * 5 + 2];
1468 int tp = (int)result_vec[k * 5 + 3];
1469 int fp = (int)result_vec[k * 5 + 4];
1473 if (tp == 0 && fp == 0)
1476 if (!rgAllTruePos.ContainsKey(j))
1477 rgAllTruePos.Add(j,
new Dictionary<
int, List<Tuple<float, int>>>());
1479 if (!rgAllTruePos[j].ContainsKey(nLabel))
1480 rgAllTruePos[j].Add(nLabel,
new List<Tuple<float, int>>());
1482 if (!rgAllFalsePos.ContainsKey(j))
1483 rgAllFalsePos.Add(j,
new Dictionary<
int, List<Tuple<float, int>>>());
1485 if (!rgAllFalsePos[j].ContainsKey(nLabel))
1486 rgAllFalsePos[j].Add(nLabel,
new List<Tuple<float, int>>());
1488 rgAllTruePos[j][nLabel].Add(
new Tuple<float, int>(fScore, tp));
1489 rgAllFalsePos[j][nLabel].Add(
new Tuple<float, int>(fScore, fp));
1494 if (sw.Elapsed.TotalMilliseconds > 1000)
1514 float fTotalmAP = 0;
1515 for (
int i = 0; i < rgAllTruePos.Count; i++)
1517 if (!rgAllTruePos.ContainsKey(i))
1518 m_log.
FAIL(
"Missing output_blob true_pos: " + i.ToString());
1520 Dictionary<int, List<Tuple<float, int>>> rgTruePos = rgAllTruePos[i];
1522 if (!rgAllFalsePos.ContainsKey(i))
1523 m_log.
FAIL(
"Missing output_blob false_pos: " + i.ToString());
1525 Dictionary<int, List<Tuple<float, int>>> rgFalsePos = rgAllFalsePos[i];
1527 if (!rgAllNumPos.ContainsKey(i))
1528 m_log.
FAIL(
"Missing output_blob num_pos: " + i.ToString());
1530 Dictionary<int, int> rgNumPos = rgAllNumPos[i];
1532 Dictionary<int, float> rgAPs =
new Dictionary<int, float>();
1536 foreach (KeyValuePair<int, int> kv
in rgNumPos)
1538 int nLabel = kv.Key;
1539 int nLabelNumPos = kv.Value;
1541 if (!rgTruePos.ContainsKey(nLabel))
1543 m_log.
WriteLine(
"WARNING: Missing true_pos for label: " + nLabel.ToString() +
"!");
1546 List<Tuple<float, int>> rgLabelTruePos = rgTruePos[nLabel];
1548 if (!rgFalsePos.ContainsKey(nLabel))
1550 m_log.
WriteLine(
"WARNING: Missing false_pos for label: " + nLabel.ToString() +
"!");
1553 List<Tuple<float, int>> rgLabelFalsePos = rgFalsePos[nLabel];
1559 if (!rgAPs.ContainsKey(nLabel))
1560 rgAPs.Add(nLabel, fAp);
1562 rgAPs[nLabel] = fAp;
1567 m_log.
WriteLine(
"class " + nLabel.ToString() +
": " + fAp.ToString());
1570 fmAP /= rgNumPos.Count;
1573 string strOutputName = test_net.
blob_names[nOutputBlobIdx];
1575 m_log.
WriteLine(
" Test net output #" + i.ToString() +
": " + strOutputName +
" = " + fmAP.ToString());
1579 return fTotalmAP / rgAllTruePos.Count;
1581 catch (Exception excpt)
1603 m_bForceTest =
false;
1608 m_log.
WriteLine(
"Iteration " +
m_nIter.ToString() +
", Testing net (#" + nTestNetId.ToString() +
")");
1619 List<double> test_score =
new List<double>();
1620 List<int> test_score_output_id =
new List<int>();
1623 if (nIterationOverride <= 0)
1626 int nIter = nIterationOverride;
1628 Stopwatch sw =
new Stopwatch();
1631 double dfTotalTiming = 0;
1633 int nAccuracyIdx = 0;
1634 int nMinRank =
int.MaxValue;
1635 bool bAccuracyValid =
false;
1636 Stopwatch swTiming =
new Stopwatch();
1638 for (
int i = 0; i < nIter; i++)
1653 dfLoss += iter_loss;
1662 test_score_output_id.Add(1);
1663 bAccuracyValid =
true;
1671 for (
int j = 0; j < colResult.
Count; j++)
1675 for (
int k = 0; k < colResult[j].count(); k++)
1677 test_score.Add(result_vec[k]);
1678 test_score_output_id.Add(j);
1683 int nRank = (int)getNumber(colResult[j].
Tag, 0);
1684 if (nRank < nMinRank)
1696 for (
int j = 0; j < colResult.
Count; j++)
1700 for (
int k = 0; k < colResult[j].count(); k++)
1702 test_score[idx] += result_vec[k];
1710 dfTotalTiming += swTiming.Elapsed.TotalMilliseconds;
1713 if (sw.ElapsedMilliseconds > 2000)
1715 double dfPct = (double)i / (
double)nIter;
1727 m_dfAverageTestTime = (nTestCount > 0) ? dfTotalTiming / nTestCount : 0;
1741 double dfFinalScore = 0;
1745 dfFinalScore = test_score.Sum();
1746 int nTotal = test_score_output_id.Sum();
1747 dfFinalScore /= nTotal;
1751 for (
int i = 0; i < test_score.Count; i++)
1753 int nIdxTestScore = test_score_output_id[i];
1755 string output_name = test_net.
blob_names[output_blob_index];
1757 double dfMeanScore = test_score[i] / nIter;
1762 if (loss_weight != 0)
1763 strOut +=
" (* " + loss_weight.ToString() +
" = " + (loss_weight * dfMeanScore).ToString() +
" loss)";
1765 m_log.
WriteLine(
" Test net output #" + i.ToString() +
": " + output_name +
" = " + dfMeanScore.ToString() + strOut);
1768 if (i == nAccuracyIdx)
1769 dfFinalScore = dfMeanScore;
1773 if (test_score.Count == 0)
1776 return dfFinalScore;
1779 private double getNumber(
object value,
double dfDefault)
1785 return (
double)(sbyte)value;
1788 return (
double)(byte)value;
1791 return (
double)(short)value;
1793 if (value is ushort)
1794 return (
double)(ushort)value;
1797 return (
double)(int)value;
1800 return (
double)(uint)value;
1803 return (
double)(long)value;
1806 return (
double)(ulong)value;
1809 return (
double)(float)value;
1811 if (value is
double)
1812 return (
double)value;
1814 if (value is decimal)
1815 return (
double)(decimal)value;
1828 if (nAverageLoss == 0)
1839 int nIdx = (
m_nIter - nStartIter) % nAverageLoss;
1844 if (m_bWeightsUpdated)
1847 m_bWeightsUpdated =
false;
1852 if (m_dfLastError < m_dfBestError)
1853 m_dfBestError = m_dfLastError;
1889 public static SGDSolver<T> Create(
CudaDnn<T> cuda,
Log log,
ProjectEx p,
CancelEvent evtCancel, AutoResetEvent evtForceSnapshot, AutoResetEvent evtForceTest,
IXDatabaseBase db,
IXPersist<T> persist,
int nSolverCount = 1,
int nSolverRank = 0,
Net<T> shareNet =
null, onGetWorkspace getws =
null, onSetWorkspace setws =
null)
1910 return Create(cuda, log, solverParam, evtCancel, evtForceSnapshot, evtForceTest, db, persist, nSolverCount, nSolverRank, shareNet, getws, setws);
1930 public static SGDSolver<T> Create(
CudaDnn<T> cuda,
Log log,
SolverParameter solverParam,
CancelEvent evtCancel, AutoResetEvent evtForceSnapshot, AutoResetEvent evtForceTest,
IXDatabaseBase db,
IXPersist<T> persist,
int nSolverCount = 1,
int nSolverRank = 0,
Net<T> shareNet =
null, onGetWorkspace getws =
null, onSetWorkspace setws =
null)
1934 switch (solverParam.
type)
1937 solver =
new SGDSolver<T>(cuda, log, solverParam, evtCancel, evtForceSnapshot, evtForceTest, db, persist, nSolverCount, nSolverRank, shareNet, getws, setws);
1941 solver =
new NesterovSolver<T>(cuda, log, solverParam, evtCancel, evtForceSnapshot, evtForceTest, db, persist, nSolverCount, nSolverRank, shareNet, getws, setws);
1945 solver =
new AdaGradSolver<T>(cuda, log, solverParam, evtCancel, evtForceSnapshot, evtForceTest, db, persist, nSolverCount, nSolverRank, shareNet, getws, setws);
1949 solver =
new AdaDeltaSolver<T>(cuda, log, solverParam, evtCancel, evtForceSnapshot, evtForceTest, db, persist, nSolverCount, nSolverRank, shareNet, getws, setws);
1953 solver =
new AdamSolver<T>(cuda, log, solverParam, evtCancel, evtForceSnapshot, evtForceTest, db, persist, nSolverCount, nSolverRank, shareNet, getws, setws);
1957 solver =
new AdamWSolver<T>(cuda, log, solverParam, evtCancel, evtForceSnapshot, evtForceTest, db, persist, nSolverCount, nSolverRank, shareNet, getws, setws);
1961 solver =
new RmsPropSolver<T>(cuda, log, solverParam, evtCancel, evtForceSnapshot, evtForceTest, db, persist, nSolverCount, nSolverRank, shareNet, getws, setws);
1965 throw new NotImplementedException(
"The solver " + solverParam.
type.ToString() +
" is not implemented yet!");
1972#pragma warning disable 1591
1974 public class OutputCollection
1976 OutputDataCollection m_rgError =
new OutputDataCollection();
1977 OutputDataCollection m_rgAccuracy =
new OutputDataCollection();
1979 public OutputCollection()
1983 public OutputDataCollection Errors
1985 get {
return m_rgError; }
1988 public OutputDataCollection Accuracies
1990 get {
return m_rgAccuracy; }
1994 public class OutputDataCollection : IEnumerable<OutputData>
1996 List<OutputData> m_rgData =
new List<OutputData>();
1998 public OutputDataCollection()
2002 public List<OutputData> Data
2004 get {
return m_rgData; }
2009 get {
return m_rgData.Count; }
2012 public OutputData
this[
int nIdx]
2014 get {
return m_rgData[nIdx]; }
2015 set { m_rgData[nIdx] = value; }
2018 public void Add(
int nTotal,
string strName,
int nIdx,
double dfVal)
2020 OutputData data = Find(strName);
2024 data =
new OutputData(strName, nIdx);
2028 data.Add(nTotal, dfVal);
2031 public OutputData Find(
string strName)
2033 foreach (OutputData data
in m_rgData)
2035 if (data.Name == strName)
2042 public IEnumerator<OutputData> GetEnumerator()
2044 return m_rgData.GetEnumerator();
2047 IEnumerator IEnumerable.GetEnumerator()
2049 return m_rgData.GetEnumerator();
2053 public class OutputData
2056 double m_dfValue = 0;
2059 public OutputData(
string strName,
int nIdx)
2061 m_strName = strName;
2067 get {
return m_nIdx; }
2072 get {
return m_strName; }
2077 get {
return m_dfValue; }
2078 set { m_dfValue = value; }
2081 public void Add(
int nTotal,
double dfVal)
2083 double dfRatio = 1.0 / (double)nTotal;
2084 m_dfValue = (m_dfValue * (1.0 - dfRatio)) + (dfRatio * dfVal);
2088#pragma warning restore 1591
The CancelEvent provides an extension to the manual cancel event that allows for overriding the manua...
bool WaitOne(int nMs=int.MaxValue)
Waits for the signal state to occur.
The Log class provides general output in text form.
void CHECK(bool b, string str)
Test a flag for true.
bool IsEnabled
Returns whether or not the Log is enabled.
void WriteLine(string str, bool bOverrideEnabled=false, bool bHeader=false, bool bError=false, bool bDisable=false)
Write a line of output.
bool Enable
Enables/disables the Log. When disabled, the Log does not output any data.
void FAIL(string str)
Causes a failure which throws an exception with the descriptive text.
double Progress
Get/set the progress associated with the Log.
void CHECK_EQ(double df1, double df2, string str)
Test whether one number is equal to another.
void WriteError(Exception e)
Write an error as output.
void CHECK_GT(double df1, double df2, string str)
Test whether one number is greater than another.
void CHECK_LE(double df1, double df2, string str)
Test whether one number is less than or equal to another.
void CHECK_GE(double df1, double df2, string str)
Test whether one number is greater than or equal to another.
The ProjectEx class manages a project containing the solver description, model description,...
string? SolverDescription
Get/set the solver description script used by the Project.
int ID
Returns the ID of the Project in the database.
string? ModelDescription
Get/set the model description script used by the Project.
The RawProto class is used to parse and output Google prototxt file data.
static RawProto Parse(string str)
Parses a prototxt and places it in a new RawProto.
The Utility class provides general utility functions.
static double[] ConvertVec(float[] rgf)
Convert an array of float to an array of generics.
The BBox class processes the NormalizedBBox data used with SSD.
void Dispose()
Clean up all resources.
float ComputeAP(List< Tuple< float, int > > rgTp, int nNumPos, List< Tuple< float, int > > rgFp, ApVersion apVersion, out List< float > rgPrec, out List< float > rgRec)
Compute the average precision given true positive and false positive vectors.
The BlobCollection contains a list of Blobs.
void Add(Blob< T > b)
Add a new Blob to the collection.
int Count
Returns the number of items in the collection.
The Blob is the main holder of data that moves through the Layers of the Net.
T GetData(int nIdx)
Returns the data at a given flat index within the Blob.
virtual void Dispose(bool bDisposing)
Releases all resources used by the Blob (including both GPU and Host).
The CudaDnn object is the main interface to the Low-Level Cuda C++ DLL.
static ulong ConvertByteSizeToCount(ulong ulSizeInBytes)
Converts the byte size into the number of items in the base data type of float or double.
The CustomForwardBackArgs provide the arguments to the OnCustomForwardBack event within the Solver St...
double LocalLoss
Get/set the local loss of the pass.
bool FwdPassNanFree
Get/set whether or a NAN was detected in the forward pass.
The GetBytesArgs is passed along to the SnapshotArgs::OnGetWeights and SnapshotArgs::OnGetState event...
byte[] Data
Get/set the data as an array of bytes.
The GetIterationArgs is bubbled up to the solver when a layer needs to know the current training ...
void SetIteration(Phase p, int nIteration)
The SetIteration method is used to set the iteration and the phase.
The GradientsReadyArgs is sent to the Solver::OnGradientsReady event which fires at the end of each S...
Connects Layers together into a directed acyclic graph (DAG) specified by a NetParameter
BlobCollection< T > Forward()
Run forward with the input Blob's already fed separately.
List< string > blob_names
Returns the blob names.
List< double > blob_loss_weights
Returns the collection of blob loss weights.
string name
Returns the network name.
List< int > output_blob_indices
Returns a list of the output Blob indexes.
The SnapshotArgs is sent to the Solver::OnSnapshot event which fires each time the Solver::Snapshot m...
bool Forced
Get/set whether or not the snapshot was forced or not.
bool SingleStep
Get/set the Solver single step.
bool IncludeWeights
Get/set whether or not to include the weights in the snapshot.
bool Scheduled
Get/set whether or not the snapshot is a regular scheduled snapshot (e.g. not an improved accuracy or...
bool IncludeState
Get/set whether or not to include the Solver state in the snapshot.
EventHandler< GetBytesArgs > OnGetState
Specifies the OnGetState event which fires when the SnapshotArgs::UpdateState method is called.
bool UpdateDatabase
Get/set whether or not to update the database (default = true).
EventHandler< GetBytesArgs > OnGetWeights
Specifies the OnGetWeights event which fires when the SnapshotArgs::UpdateWeights method is called.
The TestArgs are passed to the Solver::OnTest event.
double Accuracy
Get/set the accuracy for the test run. When overriding the testing, the override should set the accur...
The TestResultArgs are passed to the Solver::OnTestResults event.
bool AccuracyValid
Get/set the accuracy valid flag. When not valid, the OnTestResults event is ignored.
double Accuracy
Get/set the accuracy. The recipient of this event should set this value.
Specifies the TestingIterationArgs sent to the Solver::OnTestingIteration, which is called at the end...
The TrainingIterationArgs is sent to the Solver::OnTrainingIteration event that fires at the end of a...
The WorkspaceArgs are passed to both the Layer::OnSetWorkspace and Layer::OnGetWorkspace events.
long WorkspaceData
Get/set the handle to workspace data in GPU memory.
ulong WorkspaceSizeInBytes
Get/set the workspace memory size in bytes.
The Database class manages the actual connection to the physical database using Entity Framework from...
Specifies the parameters use to create a Net
static NetParameter FromProto(RawProto rp)
Parse a RawProto into a new instance of the parameter.
NetState state
The current 'state' of the network, including the phase, level and stage. Some layers may be included...
int ProjectID
Specifies the ID of the project that created this net param (if any).
int solver_rank
Specifies the rank of the solver using this network.
int solver_count
Specifies the number of solvers used in a multi-gpu training session.
NetParameter Clone(bool bCloneLayers=true, int? nSolverCount=null, int? nSolverRank=null)
Creates a new copy of this instance of the parameter.
Specifies the NetState which includes the phase, level and stage for which a given Net is to run unde...
Phase phase
Specifies the Phase of the NetState.
void MergeFrom(NetState ns)
Merges another NetState with this instance.
The SolverParameter is a parameter for the solver, specifying the train and test networks.
int max_iter
The maximum number of iterations.
List< int > test_iter
The number of iterations for each test.
NetParameter net_param
Inline train net param, possibly combined with one or more test nets.
bool debug_info
If true, print information about the state of the net that may help with debugging learning problems.
NetParameter train_net_param
Inline train net param, possibly combined with one or more test nets.
List< NetState > test_state
The states for the train/test nets. Must be unspecified or specified once per net.
SolverType
Defines the type of solver.
string lr_policy
The learning rate decay policy.
static SolverParameter FromProto(RawProto rp)
Parses a new SolverParameter from a RawProto.
ApVersion ap_version
Specifies the AP Version to use for average precision when using Single-Shot Detection (SSD) - (defau...
long random_seed
If non-negative, the seed with which the Solver will initialize the caffe random number generator – u...
int average_loss
Display the loss averaged over the last average_loss iterations.
int test_interval
The number of iterations between two testing phases.
bool output_average_results
Specifies to average loss results before they are output - this can be faster when there are a lot of...
int iter_size
Accumulate gradients over 'iter_size' x 'batch_size' instances.
string DebugString()
Returns a debug string for the SolverParameter.
EvaluationType
Defines the evaluation method used in the SSD algorithm.
bool snapshot_after_train
If false, don't save a snapshot after training finishes.
bool snapshot_include_weights
Specifies whether or not the snapshot includes the trained weights. The default = true.
bool test_compute_loss
Test the compute loss.
SolverParameter()
The SolverParameter constructor.
EvaluationType eval_type
Specifies the evaluation type to use when using Single-Shot Detection (SSD) - (default = NONE,...
bool test_initialization
If true, run an initial test pass before the first iteration, ensuring memory availability and printi...
List< NetParameter > test_net_param
Inline test net params.
int display
The number of iterations between displaying info. If display = 0, no info will be displayed.
bool snapshot_diff
Whether to snapshot diff in the results or not. Snapshotting diff will help debugging but the final p...
bool snapshot_include_state
Specifies whether or not the snapshot includes the solver state. The default = false....
bool show_per_class_result
Specifies whether or not to display results per class when using Single-Shot Detection (SSD) - (defau...
int accuracy_average_window
Specifies the window over which to average the accuracies (default = 0 which ignores averaging).
int snapshot
Specifies the snapshot interval.
SolverType type
Specifies the solver type.
NetState train_state
The states for the train/test nets. Must be unspecified or specified once per net.
Use AdaDelta Solver which has gradient based optimization like SGD.
Use AdaGrad Solver based optimization like SGD that tries to find rarely seen features.
Use Adam Solver which uses gradient based optimization like SGD that includes 'adaptive momentum esti...
Use AdamW Solver which uses gradient based optimization like Adam with a decoupled weight decay.
Use Nesterov's accelerated gradient Solver, which is similar to SGD, but the error gradient is comput...
Use RmsProp Solver which uses gradient based optimization like SGD.
Stochastic Gradient Descent solver with momentum updates weights by a linear combination of the negat...
An interface for classes that perform optimization on Nets - this class serves as the base class for ...
List< Net< T > > m_rgTestNets
Specifies the testing Nets.
int TrainingIterations
Returns the current training iterations remaining.
void InitTestNets()
Initializes the Net used by the Solver for testing.
EventHandler< CustomForwardBackArgs< T > > OnCustomForwardBack
The OnCustomForwardBack allows for overriding the forward/backward operations within the solver.
int m_nSolverCount
Specifies the Solver count in a multi-GPU training session.
void Dispose()
Discards the resources (GPU and Host) used by this Solver.
double m_dfSmoothedLoss
Specifies the smoothed loss protected for derived classes to use.
SolverParameter m_param
Specifies the SolverParameter that defines how the Solver operates.
EventHandler< TrainingIterationArgs< T > > OnTrainingIteration
The OnTrainingIteration event fires at the end of each training iteration.
List< double > m_rgLosses
Specifies the Losses used to calculate the smoothed Loss.
abstract byte[] SnapshotSolverState()
Save the current solver state.
static SGDSolver< T > Create(CudaDnn< T > cuda, Log log, ProjectEx p, CancelEvent evtCancel, AutoResetEvent evtForceSnapshot, AutoResetEvent evtForceTest, IXDatabaseBase db, IXPersist< T > persist, int nSolverCount=1, int nSolverRank=0, Net< T > shareNet=null, onGetWorkspace getws=null, onSetWorkspace setws=null)
Create a new Solver based on the project containing the SolverParameter.
double smoothed_loss
Returns the smoothed loss.
void Restore(byte[] rgWeights, byte[] rgState, string strSkipBlobTypes=null)
The restore method simply calls the RestoreSolverState method of the inherited class.
int iter
Returns the current training iteration.
CudaDnn< T > m_cuda
Specifies the instance of CudaDnn used by the Solver that provides a connection to Cuda.
void Snapshot(bool bForced, bool bScheduled, bool bUpdateDatabase=true)
The snapshot function implements the basic snapshotting utility that stores the learned net....
int MaximumIteration
Returns the maximum training iterations.
double? m_dfIterAccuracy
Specifies the iteration accuracy calculated when a blob exists with the name 'accuracy'.
Solver(CudaDnn< T > cuda, Log log, SolverParameter p, CancelEvent evtCancel, AutoResetEvent evtForceSnapshot, AutoResetEvent evtForceTest, IXDatabaseBase db, IXPersist< T > persist, int nSolverCount=1, int nSolverRank=0, Net< T > shareNet=null, onGetWorkspace getws=null, onSetWorkspace setws=null)
The Solver constructor.
EventHandler< SnapshotArgs > OnSnapshot
The OnSnapshot event fires when the Solver detects that a snapshot is needed.
bool EnableBlobDebugging
When enabled, the OnTrainingIteration event is sent extra debugging information describing the state o...
SolverParameter.SolverType type
Returns the type of solver.
Net< T > net
Returns the main training Net.
bool ForceOnTrainingIterationEvent()
Force an OnTrainingIterationEvent to fire.
object Tag
Returns a generic tag associated with the Solver.
double TestDetection(int nIterationOverride=-1, int nTestNetId=0)
Run an SSD detection test on a given test Net by running it through its iterations.
bool? is_root_solver
Returns whether or not this is the root solver.
double LearningRateOverride
Get/set the learning rate override. When 0, this setting is ignored.
bool EnableTesting
When enabled, the training cycle calls TestAll periodically based on the SolverParameter....
int m_nIter
Specifies the current iteration.
Net< T > TrainingNet
Returns the training Net used by the solver.
double m_dfLearningRateOverride
Optionally, specifies a learning rate override (default = 0, which ignores this setting).
EventHandler< TestingIterationArgs< T > > OnTestingIteration
The OnTestingIteration event fires at the end of each testing iteration.
void InitTrainNet(Net< T > shareNet=null)
Initializes the Net used by the solver for training.
abstract void RestoreSolverState(byte[] rgState)
Restore a solver state.
void UpdateSmoothedLoss(double dfLoss, int nStartIter, int nAverageLoss=0)
Update the averaged loss value.
void Init(SolverParameter p, Net< T > shareNet=null)
Initializes the Solver.
bool EnableBreakOnFirstNaN
When enabled (requires EnableBlobDebugging = true), the Solver immediately stops training upon detecti...
int solver_count
Returns the solver count in a multi-GPU session.
SolverParameter parameter
Returns the SolverParameter used.
bool forceSnapshot
Returns whether or not a snapshot has been forced.
SNAPSHOT_WEIGHT_UPDATE_METHOD SnapshotWeightUpdateMethod
Get/set the snapshot weight update method.
EventHandler OnAborted
The OnAborted event fires after aborting a training cycle.
List< Net< T > > test_nets
Returns the testing Nets.
IXPersist< T > m_persist
Specifies the persistence object used to save weight and solver states.
int TrainingTimeLimitInMinutes
Get/set the training time limit in minutes. When set to 0, no time limit is imposed on training.
EventHandler< WorkspaceArgs > OnGetWorkspace
Specifies the OnGetWorkspace event that fires when the getWorkspace() function is called by a layer t...
double TestClassification(int nIterationOverride=-1, int nTestNetId=0)
Run a test on a given test Net by running it through its iterations.
void Reset()
Reset the iterations of the net.
bool Step(int nIters, TRAIN_STEP step=TRAIN_STEP.NONE, bool bZeroDiffs=true, bool bApplyUpdates=true, bool bDisableOutput=false, bool bDisableProgress=false, double? dfLossOverride=null, bool? bAllowSnapshot=null)
Steps a set of iterations through a training cycle.
double TestAll(int nIterationOverride=-1)
Run a TestAll by running all test Nets.
string LabelQueryEpochs
Return the label query epochs for the active datasource.
EventHandler< TestResultArgs< T > > OnTestResults
When specified, the OnTestResults event fires after each single test run. The recipient is responsibl...
EventHandler< GradientsReadyArgs > OnGradientsReady
The OnGradientsReady event fires after the gradients of a Solver are ready for distribution to other ...
EventHandler< WorkspaceArgs > OnSetWorkspace
Specifies the OnSetWorkspace event that fires when the setWorkspace() function is called by a layer t...
int? TestingIterations
Returns the current testing iterations remaining.
static SGDSolver< T > Create(CudaDnn< T > cuda, Log log, SolverParameter solverParam, CancelEvent evtCancel, AutoResetEvent evtForceSnapshot, AutoResetEvent evtForceTest, IXDatabaseBase db, IXPersist< T > persist, int nSolverCount=1, int nSolverRank=0, Net< T > shareNet=null, onGetWorkspace getws=null, onSetWorkspace setws=null)
Create a new Solver based on the project containing the SolverParameter.
bool forceTest
Returns whether or not a test has been forced.
int TrainingIterationOverride
Get/set the training iteration override.
EventHandler OnTestStart
The OnTestStart event fires at the start of each testing iteration.
Net< T > m_net
Specifies the training Net.
bool WeightsUpdated
Get/set when the weights have been updated.
int m_nCurrentStep
Specifies the current step.
int solver_rank
Returns this Solver's rank in a multi-GPU session.
bool EnableDetailedNanDetection
When enabled (requires EnableBlobDebugging = true), the detailed NaN (and Infinity) detection is performed...
Log m_log
Specifies the Log for output.
SnapshotArgs GetSnapshotArgs(byte[] rgState, byte[] rgWeights, double dfAccuracy, double dfError, int nIteration, SNAPSHOT_WEIGHT_UPDATE_METHOD wtUpdt)
The GetSnapshotArgs method fills out a snapshot args structure.
virtual void dispose()
Override that allows discarding of resources (GPU and Host) used by this Solver.
EventHandler< TestArgs > OnTest
When specified, the OnTest event fires during a TestAll and overrides the call to Test.
int TestingIterationOverride
Get/set the testing iteration override.
virtual void Solve(int nIterationOverride=-1, byte[] rgWeights=null, byte[] rgState=null, TRAIN_STEP step=TRAIN_STEP.NONE)
The main entry of the solver function. In default, iter will be zero. Pass in a non-zero iter number ...
EventHandler OnStart
The OnStart event fires at the start of each training iteration.
string ActiveLabelCounts
Returns a string describing the labels detected in the training along with the % that each label has ...
AutoResetEvent CompletedEvent
Returns an auto reset event that is set upon training completion.
abstract double ApplyUpdate(int nIterationOverride=-1)
Make and apply the update value for the current iteration.
CudaDnn< T > Cuda
Returns the CudaDnn instance used by the Solver.
bool EnableSingleStep
When enabled (requires EnableBlobDebugging = true), the Solver only runs one training cycle.
int m_nSolverRank
Specifies the Solver rank of this solver, where rank == 0 is the root Solver.
string LabelQueryHitPercents
Return the label query hit percentages for the active datasource.
Net< T > TestingNet
Returns the testing Net used by the solver.
bool EnableLayerDebugging
Enable/disable layer debugging which causes each layer to check for NAN/INF on each forward/backward ...
int CurrentIteration
Returns the current training iteration.
The IXDatabaseBase interface defines the general interface to the in-memory database.
The IXPersist interface is used by the CaffeControl to load and save weights.
The MyCaffe.basecode namespace contains all generic types used throughout MyCaffe.
Phase
Defines the Phase under which to run a Net.
SNAPSHOT_WEIGHT_UPDATE_METHOD
Defines the snapshot weight update method.
The MyCaffe.common namespace contains common MyCaffe classes.
BLOB_TYPE
Defines the type of data held by a given Blob.
TRAIN_STEP
Defines the training stepping method (if any).
The MyCaffe.db.image namespace contains all image database related classes.
The MyCaffe.param namespace contains parameters used to create models.
The MyCaffe.solvers namespace contains all solver classes, including the base Solver.
The MyCaffe namespace contains the main body of MyCaffe code that closely tracks the C++ Caffe open-...