2 using System.Collections.Generic;
7 using System.Threading.Tasks;
49 m_lCount = total_size(root_solver.net.learnable_parameters);
85 for (int i = 0; i < rgParam.Count; i++)
87 nSize += (long)rgParam[i].count();
153 m_cuda.SetDeviceID(nDeviceID);
225 for (int i = 0; i < rgBlobs.Count; i++)
227 int nCount = rgBlobs[i].count();
233 m_cuda.copy(nCount, rgBlobs[i].data.gpu_data, hBuffer, 0, (int)lOffset);
237 rgBlobs[i].data.set_gpu_data(hBuffer, nCount, lOffset);
240 case Op.replace_gpu_diff:
241 if (rgBlobs[i].DiffExists)
242 rgBlobs[i].diff.set_gpu_data(hBuffer, nCount, lOffset);
251 m_log.CHECK_EQ(lTotalSize - m_lExtra, (lOffset == 0) ? 1 : lOffset, "The total memory doesn't match.");
270 ManualResetEvent m_evtGradientsReady = new ManualResetEvent(false);
271 List<ManualResetEvent> m_rgGradientReady = new List<ManualResetEvent>();
283 : base(cuda, log, root_solver, nDeviceID)
285 m_rgGradientReady = rgGradientReadyEvents;
286 if (rgGradientReadyEvents != null && rgGradientReadyEvents.Count > 0)
287 m_evtGradientsReady = rgGradientReadyEvents[root_solver.solver_rank];
289 m_solver = root_solver;
323 m_cuda.SynchronizeStream();
324 m_evtGradientsReady.Set();
326 while (!WaitHandle.WaitAll(m_rgGradientReady.ToArray(), 250))
338 m_evtGradientsReady.Reset();
351 public void Run(List<int> rgGpus, int nIterationOverride = -1)
353 List<long> rghNccl = new List<long>();
354 Guid guid = Guid.NewGuid();
356 m_rgGradientReady = new List<ManualResetEvent>();
358 for (int i = 0; i < rgGpus.Count; i++)
362 m_rgGradientReady.Add(new ManualResetEvent(false));
365 m_cuda.NcclInitializeSingleProcess(rghNccl.ToArray());
366 m_hNccl = rghNccl[0];
367 m_evtGradientsReady = m_rgGradientReady[0];
369 List<WaitHandle> rgWaitAllInit = new List<WaitHandle>();
370 List<Worker<T>> rgWorkers = new List<common.Worker<T>>();
371 ManualResetEvent evtAllCreated = new ManualResetEvent(false);
373 for (int i = 1; i < rghNccl.Count; i++)
380 List<WaitHandle> rgWait = new List<WaitHandle>();
381 rgWait.AddRange(m_solver.CancelEvent.Handles);
385 int nWait = WaitHandle.WaitAny(rgWait.ToArray());
386 if (nWait < rgWait.Count - 2)
389 if (nWait == rgWait.Count - 2)
391 if (info.Error != null)
394 throw new Exception("Error starting the solver.");
398 rgWorkers.Add(worker);
402 while (!WaitHandle.WaitAll(rgWaitAllInit.ToArray(), 250))
408 m_cuda.SynchronizeDevice();
414 m_solver.Solve(nIterationOverride);
417 for (int i = 0; i < rgWorkers.Count; i++)
419 rgWorkers[i].StopInternalThread();
437 this.DoWork += Worker_DoWork;
450 Log log = new Log("Worker solver for DeviceID = " + e.DeviceID.ToString());
469 log.CHECK_EQ((int)solver.type, (int)rank0.type, "The solver types should be the same.");
480 m_cuda.SynchronizeDevice();
482 List<WaitHandle> rgWait = new List<WaitHandle>();
486 int nWait = WaitHandle.WaitAny(rgWait.ToArray());
487 if (nWait < rgWait.Count - 1)
496 solver.Step(nIterations);
499 catch (Exception excpt)
521 string m_strCudaPath;
526 int m_nIterationOverride;
527 ManualResetEvent m_evtInitialized = new ManualResetEvent(false);
528 ManualResetEvent m_evtStarted = new ManualResetEvent(false);
529 ManualResetEvent m_evtAllCreated = new ManualResetEvent(false);
530 AutoResetEvent m_evtError = new AutoResetEvent(false);
531 List<ManualResetEvent> m_rgGradientReadyEvents = null;
532 Exception m_error = null;
545 public SolverInfo(Solver<T> rank0, long hSrcKernel, long hSrcNccl, int nSolverRank, int nIterationOverride, string strCudaPath, List<ManualResetEvent> rgGradientReadyEvents, ManualResetEvent evtAllCreated)
547 m_strCudaPath = strCudaPath;
549 m_hSrcKernel = hSrcKernel;
550 m_hSrcNccl = hSrcNccl;
551 m_nSolverRank = nSolverRank;
552 m_nIterationOverride = nIterationOverride;
553 m_rgGradientReadyEvents = rgGradientReadyEvents;
554 m_evtAllCreated = evtAllCreated;
562 get { return m_rank0; }
570 get { return m_strCudaPath; }
578 get { return m_nIterationOverride; }
586 get { return m_hSrcKernel; }
594 get { return m_hSrcNccl; }
602 get { return m_nSolverRank; }
610 get { return m_evtInitialized; }
618 get { return m_evtStarted; }
626 get { return m_evtAllCreated; }
634 get { return m_rgGradientReadyEvents; }
642 get { return m_error; }
643 set { m_error = value; }
651 get { return m_evtError; }
WaitHandle[] Handles
Returns the internal wait handles of the CancelEvent.
bool WaitOne(int nMs=int.MaxValue)
Waits for the signal state to occur.
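As a sketch of how these handles are used, the Run() and Worker_DoWork fragments above combine CancelEvent.Handles with the worker's error and started events and then WaitAny over the lot, so a cancel request interrupts the wait. The helper below is a minimal, illustrative reconstruction of that pattern; the wrapper class, method name, and the assumption that the events were created elsewhere are not part of the library.

    using System;
    using System.Collections.Generic;
    using System.Threading;
    using MyCaffe.basecode;
    using MyCaffe.solvers;

    static class CancelExample
    {
        // Illustrative helper: wait for a cancel request, an error, or the started signal.
        public static bool WaitForWorkerStart<T>(Solver<T> solver, AutoResetEvent evtError, ManualResetEvent evtStarted)
        {
            List<WaitHandle> rgWait = new List<WaitHandle>();
            rgWait.AddRange(solver.CancelEvent.Handles); // cancel handles occupy the low indexes
            rgWait.Add(evtError);
            rgWait.Add(evtStarted);

            int nWait = WaitHandle.WaitAny(rgWait.ToArray());
            if (nWait < rgWait.Count - 2)     // one of the cancel handles fired
                return false;
            if (nWait == rgWait.Count - 2)    // the error event fired
                throw new Exception("Error starting the solver.");

            return true;                      // the started event fired
        }
    }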
The Log class provides general output in text form.
bool Enable
Enables/disables the Log. When disabled, the Log does not output any data.
void CHECK_EQ(double df1, double df2, string str)
Test whether one number is equal to another.
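For instance, Worker_DoWork above (line 469) uses CHECK_EQ to confirm that the worker's solver type matches the rank 0 solver's type. A minimal sketch of that usage, assuming both solvers already exist; the wrapper class and method name are illustrative only.

    using MyCaffe.basecode;
    using MyCaffe.solvers;

    static class LogExample
    {
        // Illustrative check that two solvers are of the same type, reported through a Log.
        public static void VerifySolverTypes<T>(Solver<T> solver, Solver<T> rank0)
        {
            Log log = new Log("Worker solver for DeviceID = " + solver.parameter.device_id.ToString());
            log.Enable = true;  // when disabled, the Log outputs nothing
            log.CHECK_EQ((int)solver.type, (int)rank0.type, "The solver types should be the same.");
        }
    }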
The ActionStateArgs are sent to the DoWork event when fired from the InternalThreadEntry.
object Arg
Returns the user supplied argument.
int DeviceID
Returns the Device ID of the device to use in the thread.
The BlobCollection contains a list of Blobs.
int Count
Returns the number of items in the collection.
The CudaDnn object is the main interface to the Low-Level Cuda C++ DLL.
The GPUParams contains the connection to the low-level Cuda, and the stream associated with this inst...
long m_hStream
The handle to the Cuda stream used for synchronization.
void Configure(Solver< T > solver)
Configure the GPU Params by copying the Solver training Net parameters into the data and diff buffers...
GPUParams(CudaDnn< T > cuda, Log log, Solver< T > root_solver, int nDeviceID)
The GPUParams constructor.
void apply_buffers(BlobCollection< T > rgBlobs, long hBuffer, long lTotalSize, Op op)
Transfer between the data/diff buffers and a collection of Blobs (e.g. the learnable parameters).
Log m_log
The Log used for output.
void SynchronizeStream()
Synchronize with the Cuda stream.
void Dispose()
Release all GPU and Host resources used.
CudaDnn< T > m_cuda
The instance of CudaDnn that provides the connection to Cuda.
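Tying the members above together: a GPUParams instance allocates the flat data/diff buffers sized from the root Solver's learnable parameters (lines 49 and 85-87), and Configure then calls apply_buffers to point a Solver's blobs at those shared buffers (lines 225-242). A minimal sketch of that flow, assuming cuda, log and the solvers are constructed elsewhere; the wrapper class and method name are illustrative.

    using MyCaffe.basecode;
    using MyCaffe.common;
    using MyCaffe.solvers;

    static class GpuParamsExample
    {
        public static GPUParams<T> ShareParameters<T>(CudaDnn<T> cuda, Log log,
            Solver<T> rootSolver, Solver<T> workerSolver, int nDeviceID)
        {
            // Allocate the shared data/diff buffers from the root solver's learnable parameters.
            GPUParams<T> p = new GPUParams<T>(cuda, log, rootSolver, nDeviceID);

            // Copy the worker solver's parameters into the buffers and re-point its blobs at them
            // (the replace_gpu_data / replace_gpu_diff ops of apply_buffers).
            p.Configure(workerSolver);

            p.SynchronizeStream();  // make sure the copies complete before training starts
            return p;
        }
    }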
The GradientsReadyArgs is sent to the Solver::OnGradientsReady event which fires at the end of each S...
The InternalThread manages an internal thread used for Parallel and data collection operations.
void StartInternalThread(CudaDnn< T > cuda, Log log, int nDeviceID=0, object arg=null, int nInitialDelay=0)
Starts running the internal thread function which then calls the DoWork event.
EventHandler< ActionStateArgs< T > > DoWork
The DoWork event is the working thread function.
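The Worker above is built on exactly this pattern: its constructor hooks DoWork (line 437) and Run() later starts each worker thread with a device ID and a SolverInfo as the user argument, stopping it with StopInternalThread (line 419). A minimal, illustrative subclass showing the same wiring; everything except the documented API is hypothetical.

    using MyCaffe.basecode;
    using MyCaffe.common;

    public class MyWorker<T> : InternalThread<T>
    {
        public MyWorker()
        {
            DoWork += MyWorker_DoWork;  // the DoWork event is the thread function
        }

        private void MyWorker_DoWork(object sender, ActionStateArgs<T> e)
        {
            // e.DeviceID selects the GPU for this thread; e.Arg carries the user supplied argument.
            Log log = new Log("Worker thread for DeviceID = " + e.DeviceID.ToString());
            object arg = e.Arg;  // in the multi-GPU case this is a SolverInfo<T>
            // ... per-device work goes here ...
        }
    }

Starting it then looks like worker.StartInternalThread(cuda, log, nDeviceID, arg), and StopInternalThread() shuts the thread down once training completes.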
The NCCL class manages the multi-GPU operations using the low-level NCCL functionality provided by th...
new void Dispose()
Release all GPU and Host resources used.
NCCL(CudaDnn< T > cuda, Log log, Solver< T > root_solver, int nDeviceID, long hNccl, List< ManualResetEvent > rgGradientReadyEvents)
The NCCL constructor.
void Run(List< int > rgGpus, int nIterationOverride=-1)
Run the root Solver and coordinate with all other Solver's participating in the multi-GPU training.
void Broadcast()
Broadcast the data to all other solvers participating in the multi-GPU session.
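In the fragments above, the root NCCL instance is created on the main GPU, Run() initializes the per-GPU NCCL handles, spawns one Worker per extra GPU and then calls Solve on the root Solver, while Broadcast pushes the initial weights out to the other solvers. A minimal sketch of driving training through an already constructed NCCL<T> instance; the wrapper class and method name are illustrative, and building the instance itself requires the cuda/log/solver plumbing shown in the constructor above.

    using System.Collections.Generic;
    using MyCaffe.common;

    static class NcclExample
    {
        public static void TrainMultiGpu<T>(NCCL<T> nccl, List<int> rgGpus, int nIterationOverride = -1)
        {
            try
            {
                // Run the root Solver and coordinate the other Solvers, one per GPU in rgGpus.
                nccl.Run(rgGpus, nIterationOverride);
            }
            finally
            {
                nccl.Dispose();  // release the GPU and host resources
            }
        }
    }

For example, TrainMultiGpu(nccl, new List<int> { 0, 1 }) would train across GPUs 0 and 1, with the default of -1 presumably leaving the iteration count to the SolverParameter.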
The Params contains the base parameters used in multi-GPU training.
long data
Returns the handle to the GPU memory containing the Net parameters.
Params(Solver< T > root_solver)
The Params constructor.
long m_lExtra
Size of the padding added to the memory buffers.
long count
Returns the size of the buffers (in items).
long m_lCount
Size of the buffers (in items).
long diff
Returns the handle to the GPU memory containing the Net gradients.
long m_hDiff
Handle to GPU memory containing the Net gradient.
long m_hData
Handle to GPU memory containing the Net parameters.
int m_nDeviceID
The Device ID.
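Lines 49 and 85-87 above show how m_lCount is computed: the counts of all learnable parameter blobs are summed, and m_lExtra pads the final allocation. A small, illustrative reconstruction of that accumulation over a BlobCollection; the wrapper class and method name are not part of the library.

    using MyCaffe.common;

    static class ParamsExample
    {
        // Sum the item counts of every blob in the collection (the basis of m_lCount).
        public static long TotalSize<T>(BlobCollection<T> rgParam)
        {
            long nSize = 0;

            for (int i = 0; i < rgParam.Count; i++)
                nSize += (long)rgParam[i].count();

            return nSize;
        }
    }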
The SolverInfo defines the user supplied arguments passed to each Worker.
int IterationOverride
Returns the training iteration override to use.
AutoResetEvent ErrorEvent
Returns the event that is set when an error occurs.
Exception Error
Returns the error (if any) that occurred when running the solver thread.
SolverInfo(Solver< T > rank0, long hSrcKernel, long hSrcNccl, int nSolverRank, int nIterationOverride, string strCudaPath, List< ManualResetEvent > rgGradientReadyEvents, ManualResetEvent evtAllCreated)
The SolverInfo constructor.
string CudaPath
Returns the file path to the low-level CudaDnnDll.DLL file to use. Note, when null or empty,...
ManualResetEvent StartedEvent
Returns the event that is set after the Worker has started running.
long KernelHandle
Returns a handle to the kernel where the NCCL for this Solver was created (typically this is the kern...
Solver< T > Rank0
Returns the rank 0 Solver that will run in the Worker.
List< ManualResetEvent > GradientReadyEvents
Returns the list of events, one per Solver, that are set after that Solver's gradients are ready.
long NcclHandle
Returns the handle to the NCCL instance for this Solver (typically this is created on the kernel that...
ManualResetEvent AllCreatedEvent
Returns the event that is set after all Workers have been created.
ManualResetEvent InitializedEvent
Returns the event that is set after the Worker has completed initializing.
int SolverRank
Returns the rank of this Solver.
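In Run() above, one SolverInfo is built per additional GPU and handed to a Worker as the user argument of StartInternalThread; the root then waits on the Initialized/Started/Error events before continuing. A minimal sketch of that hand-off, assuming the kernel and NCCL handles and the event list were created as in the fragments; the wrapper class and method name are illustrative.

    using System.Collections.Generic;
    using System.Threading;
    using MyCaffe.basecode;
    using MyCaffe.common;
    using MyCaffe.solvers;

    static class SolverInfoExample
    {
        public static void StartWorker<T>(Worker<T> worker, CudaDnn<T> cuda, Log log, Solver<T> rank0,
            int nDeviceID, long hSrcKernel, long hSrcNccl, int nSolverRank, int nIterationOverride,
            string strCudaPath, List<ManualResetEvent> rgGradientReady, ManualResetEvent evtAllCreated)
        {
            SolverInfo<T> info = new SolverInfo<T>(rank0, hSrcKernel, hSrcNccl, nSolverRank,
                nIterationOverride, strCudaPath, rgGradientReady, evtAllCreated);

            // The SolverInfo travels to Worker_DoWork as e.Arg.
            worker.StartInternalThread(cuda, log, nDeviceID, info);

            info.StartedEvent.WaitOne();  // block until the worker reports that it has started
        }
    }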
The Worker manages a non-root Solver, where each Worker operates on a different GPU.
Worker()
The Worker constructor.
The SolverParameter is a parameter for the solver, specifying the train and test networks.
int max_iter
The maximum number of iterations.
SolverParameter Clone()
Creates a new copy of the SolverParameter.
int device_id
The device id that will be used when run on the GPU.
SolverType type
Specifies the solver type.
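A worker typically clones the rank 0 SolverParameter and retargets it at its own GPU before creating its Solver, which is roughly what Worker_DoWork does. A minimal sketch using only the documented members; the wrapper class and method name are illustrative.

    using MyCaffe.param;
    using MyCaffe.solvers;

    static class SolverParameterExample
    {
        public static SolverParameter CloneForDevice<T>(Solver<T> rank0, int nDeviceID)
        {
            SolverParameter p = rank0.parameter.Clone();  // copy the train/test net settings
            p.device_id = nDeviceID;                      // run this copy on the worker's GPU
            return p;
        }
    }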
An interface for classes that perform optimization on Nets - this class serves as the base class for ...
void Dispose()
Discards the resources (GPU and Host) used by this Solver.
static SGDSolver< T > Create(CudaDnn< T > cuda, Log log, ProjectEx p, CancelEvent evtCancel, AutoResetEvent evtForceSnapshot, AutoResetEvent evtForceTest, IXDatabaseBase db, IXPersist< T > persist, int nSolverCount=1, int nSolverRank=0, Net< T > shareNet=null, onGetWorkspace getws=null, onSetWorkspace setws=null)
Create a new Solver based on the project containing the SolverParameter.
int iter
Returns the current training iteration.
SolverParameter.SolverType type
Returns the type of solver.
Net< T > net
Returns the main training Net.
int solver_count
Returns the solver count in a multi-GPU session.
CancelEvent CancelEvent
Returns the cancel event which when set cancels the current operation run by the Solver.
SolverParameter parameter
Returns the SolverParameter used.
bool Step(int nIters, TRAIN_STEP step=TRAIN_STEP.NONE, bool bZeroDiffs=true, bool bApplyUpdates=true, bool bDisableOutput=false, bool bDisableProgress=false, double? dfLossOverride=null, bool? bAllowSnapshot=null)
Steps a set of iterations through a training cycle.
EventHandler< GradientsReadyArgs > OnGradientsReady
The OnGradientsReady event fires after the gradients of a Solver are ready for distribution to other ...
int solver_rank
Returns this Solver's rank in a multi-GPU session.
IXDatabaseBase Database
Returns the in-memory MyCaffeDatabase used.
virtual void Solve(int nIterationOverride=-1, byte[] rgWeights=null, byte[] rgState=null, TRAIN_STEP step=TRAIN_STEP.NONE)
The main entry of the solver function. By default, iter will be zero. Pass in a non-zero iter number ...
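The multi-GPU exchange hangs off OnGradientsReady: each Step computes the local gradients and fires the event, and the GPUParams/NCCL code then signals its gradient-ready event and waits for the other solvers (lines 323-338) before the update is applied. A minimal sketch of wiring a handler and stepping, assuming the Solver was created elsewhere (for example via SGDSolver<T>.Create); the wrapper class, method name, and handler body are illustrative.

    using MyCaffe.common;
    using MyCaffe.solvers;

    static class SolverExample
    {
        public static void RunWithGradientHook<T>(Solver<T> solver, int nIterations)
        {
            solver.OnGradientsReady += (sender, args) =>
            {
                // Fires at the end of each step, once the local gradients are ready;
                // this is where the multi-GPU code synchronizes and reduces gradients.
            };

            solver.Step(nIterations);  // run a fixed number of training iterations
            // solver.Solve() would instead run the full schedule up to SolverParameter.max_iter.
        }
    }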
The MyCaffe.basecode contains all generic types used throughout MyCaffe.
The MyCaffe.common namespace contains common MyCaffe classes.
DEVINIT
Specifies the initialization flags used when initializing CUDA.
NCCL_REDUCTION_OP
Specifies the reduction operation to use with 'Nickel' NCCL.
The MyCaffe.param namespace contains parameters used to create models.
The MyCaffe.solvers namespace contains all solver classes, including the base Solver.
The MyCaffe namespace contains the main body of MyCaffe code that closely tracks the C++ Caffe open-...