using System.Collections.Generic;
using System.Threading.Tasks;
int m_nIterations = 1000;                  // total solver iterations
int m_nDisplayEvery = 100;                 // solver display interval
double m_dfTVLossWeight = 0;               // total-variation loss weight (0 = disabled)
double m_dfStyleDataScale1 = 0.0001;
double m_dfStyleDataScale2 = 1;
double m_dfContentDataScale = 0.0001;
double m_dfContentLossScale = 0.0001;
byte[] m_rgWeights = null;                 // pre-trained model weights
Dictionary<string, Dictionary<string, double>> m_rgLayers = new Dictionary<string, Dictionary<string, double>>();
List<string> m_rgstrUsedLayers = new List<string>();
List<double> m_rgMeanValues = new List<double>();
double m_dfLearningRate = 1.0;
int m_nDefaultMaxImageSize = 840;
string m_strDataBlobName = "data";
int m_nIntermediateOutput = 0;
int m_nPartialIteration = 0;
int m_nPartialIterations1 = 0;
bool m_bUsingSharedNet = false;
int m_nLBFGSCorrections = 100;
bool m_bAllowHalfSize = false;
bool m_bAllowHalfSizeOnGram = true;
bool m_bAllowHalfSizeOnEvent = true;
bool m_bAllowHalfSizeOnLoss = true;
bool m_bAllowHalfSizeOnScalar = true;
long m_hWorkspaceData = 0;                 // handle to shared GPU workspace memory
ulong m_lWorkspaceSizeInBytes = 0;
public NeuralStyleTransfer(CudaDnn<T> cuda, Log log, CancelEvent evtCancel,
                           string strModelType, string strModel, byte[] rgWeights, bool bCaffeModel,
                           SolverParameter.SolverType solverType = SolverParameter.SolverType.LBFGS,
                           double dfLearningRate = 1.5, int nLBFGSCorrections = 100,
                           double dfDataScale = 1.0, Net<T> netShare = null)
{
    m_evtCancel = evtCancel;
    m_rgWeights = rgWeights;
    m_solverType = solverType;
    m_dfLearningRate = dfLearningRate;
    m_nLBFGSCorrections = nLBFGSCorrections;

    setupNetShare(netShare, cuda);

    if (m_evtCancel != null)
        // ...

    add_input_layer(m_param);
    m_rgstrUsedLayers = load_layers(strModelType);
    prune(m_param, m_rgstrUsedLayers);
    add_gram_layers(m_param);

    m_transformationParam.scale = dfDataScale;
    m_transformationParam.mean_value = m_rgMeanValues;
    // ...
}
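For orientation, a minimal construction sketch (illustrative only: the file paths are hypothetical, cuda and log are pre-existing CudaDnn<T> and Log instances, and the recognized strModelType values are elided from this listing, though the layer defaults below suggest a VGG model):

    // Hypothetical setup; the 'vgg19.*' paths and the "vgg19" type string are assumptions.
    byte[] rgWeights = File.ReadAllBytes("vgg19.caffemodel");
    string strModel = File.ReadAllText("vgg19.prototxt");
    CancelEvent evtCancel = new CancelEvent();

    NeuralStyleTransfer<float> nst = new NeuralStyleTransfer<float>(
        cuda, log, evtCancel, "vgg19", strModel, rgWeights,
        true,                               // bCaffeModel
        SolverParameter.SolverType.LBFGS,   // default solver
        1.5);                               // dfLearningRate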
public NeuralStyleTransfer(CudaDnn<T> cuda, Log log, CancelEvent evtCancel,
                           Dictionary<string, Tuple<double, double>> rgLayers, string strModelDesc,
                           byte[] rgWeights, bool bCaffeModel,
                           SolverParameter.SolverType solverType = SolverParameter.SolverType.LBFGS,
                           double dfLearningRate = 1.0, int nMaxImageSize = 840,
                           int nLBFGSCorrections = 100, double dfDataScale = 1.0,
                           Net<T> netShare = null)
{
    m_evtCancel = evtCancel;
    m_rgWeights = rgWeights;
    m_solverType = solverType;
    m_dfLearningRate = dfLearningRate;
    m_nDefaultMaxImageSize = nMaxImageSize;
    m_nLBFGSCorrections = nLBFGSCorrections;

    setupNetShare(netShare, cuda);

    if (m_evtCancel != null)
        // ...

    Dictionary<string, double> rgStyle = new Dictionary<string, double>();
    Dictionary<string, double> rgContent = new Dictionary<string, double>();

    // Split each layer's (style, content) weight tuple into separate dictionaries,
    // skipping zero weights.
    foreach (KeyValuePair<string, Tuple<double, double>> kv in rgLayers)
    {
        if (kv.Value.Item1 != 0)
            rgStyle.Add(kv.Key, kv.Value.Item1);

        if (kv.Value.Item2 != 0)
            rgContent.Add(kv.Key, kv.Value.Item2);
    }

    add_input_layer(m_param);
    m_rgstrUsedLayers = load_layers(rgStyle, rgContent);
    prune(m_param, m_rgstrUsedLayers);
    add_gram_layers(m_param);

    m_transformationParam.scale = dfDataScale;
    m_transformationParam.mean_value = m_rgMeanValues;
    // ...
}
    if (m_solver != null)
        // ...

    if (m_hWorkspaceData != 0)
    {
        m_cuda.FreeMemory(m_hWorkspaceData);
        m_hWorkspaceData = 0;
        m_lWorkspaceSizeInBytes = 0;
    }

    if (m_transformer != null)
        // ...
        m_transformer = null;
public void SetupHalfSize(bool bAllowHs, bool bAllowOnGram, bool bAllowOnEvent,
                          bool bAllowOnLoss, bool bAllowOnScalar)
{
    m_bAllowHalfSize = bAllowHs;
    m_bAllowHalfSizeOnEvent = bAllowOnEvent;
    m_bAllowHalfSizeOnGram = bAllowOnGram;
    m_bAllowHalfSizeOnLoss = bAllowOnLoss;
    m_bAllowHalfSizeOnScalar = bAllowOnScalar;

    if (!bAllowHs || !m_bAllowHalfSizeOnGram)
    {
        List<string> rgstrHalfLayers = new List<string>();
        // ...
        if (layer1.name.Contains("gram"))
            rgstrHalfLayers.Add(layer1.name);
        // ...
        if (!bAllowHs && rgstrHalfLayers.Count > 0)
        {
            string strErr = "Half-sized memory not supported! Disable half-size in the following layers: " +
                            Utility.ToString<string>(rgstrHalfLayers);
            // ...
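A call that keeps half-sized memory enabled everywhere except the loss layers might look as follows (a sketch; the argument order follows the signature above):

    // Full precision only for the loss layers; half size elsewhere.
    nst.SetupHalfSize(true,    // bAllowHs
                      true,    // bAllowOnGram
                      true,    // bAllowOnEvent
                      false,   // bAllowOnLoss
                      true);   // bAllowOnScalar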
    int nNetDeviceId = net.Cuda.GetDeviceID();
    // ...
    if (nNetDeviceId != nCudaDeviceId)
        // ...

    m_cuda = m_netShare.Cuda;
    m_bUsingSharedNet = true;
    List<int> rgDelIdx = new List<int>();
    // ...
    for (int i = 0; i < p.layer.Count; i++)
    {
        // ...
        if (data_param == null)
        {
            data_param = p.layer[i];
            m_strDataBlobName = data_param.top[0];
        }
        // ...
        m_strDataBlobName = input.top[0];
        // ...
    }

    // Remove the flagged layers from the end so earlier indexes stay valid.
    for (int i = rgDelIdx.Count - 1; i >= 0; i--)
        p.layer.RemoveAt(rgDelIdx[i]);

    // ...
    input.name = "input1";
    input.top.Add(m_strDataBlobName);
    // ...
    p.layer.Insert(0, input);
    // ...
    input.name = "input1";
private List<string> load_layers(string strName)
{
    Dictionary<string, double> rgContent = new Dictionary<string, double>();
    Dictionary<string, double> rgStyle = new Dictionary<string, double>();

    // ... (VGG defaults)
    rgContent.Add("conv4_2", 1);
    rgStyle.Add("conv1_1", 0.2);
    rgStyle.Add("conv2_1", 0.2);
    rgStyle.Add("conv3_1", 0.2);
    rgStyle.Add("conv4_1", 0.2);
    rgStyle.Add("conv5_1", 0.2);
    m_rgMeanValues = new List<double>() { 103.939, 116.779, 123.68 };  // BGR channel means

    // ... (GoogLeNet defaults)
    rgContent.Add("conv2/3x3", 2e-4);
    rgContent.Add("inception_3a/output", 1 - 2e-4);
    rgStyle.Add("conv1/7x7_s2", 0.2);
    rgStyle.Add("conv2/3x3", 0.2);
    rgStyle.Add("inception_3a/output", 0.2);
    rgStyle.Add("inception_4a/output", 0.2);
    rgStyle.Add("inception_5a/output", 0.2);
    m_rgMeanValues = new List<double>() { 104, 117, 123 };

    // ... (CaffeNet defaults)
    rgContent.Add("conv4", 1);
    rgStyle.Add("conv1", 0.2);
    rgStyle.Add("conv2", 0.2);
    rgStyle.Add("conv3", 0.2);
    rgStyle.Add("conv4", 0.2);
    rgStyle.Add("conv5", 0.2);

    // ...
    throw new Exception("Model '" + strName + "' is not supported.");
    // ...
    return load_layers(rgStyle, rgContent);
}
private List<string> load_layers(Dictionary<string, double> rgStyle, Dictionary<string, double> rgContent)
{
    m_rgLayers = new Dictionary<string, Dictionary<string, double>>();
    m_rgLayers.Add("content", rgContent);
    m_rgLayers.Add("style", rgStyle);

    List<string> rgstrUsedLayers = new List<string>();

    foreach (KeyValuePair<string, double> kv in rgContent)
    {
        rgstrUsedLayers.Add(kv.Key);
    }

    // Each style layer gets a companion 'gram_' entry for its Gram matrix layer.
    Dictionary<string, double> rgGram = new Dictionary<string, double>();
    foreach (KeyValuePair<string, double> kv in rgStyle)
    {
        rgstrUsedLayers.Add(kv.Key);
        rgGram.Add("gram_" + kv.Key, kv.Value);
    }

    m_rgLayers.Add("gram", rgGram);

    // The 'input' set is the union of the content and gram entries.
    Dictionary<string, double> rgInput = new Dictionary<string, double>();
    foreach (KeyValuePair<string, double> kv in rgContent)
    {
        rgInput.Add(kv.Key, kv.Value);
    }

    foreach (KeyValuePair<string, double> kv in rgGram)
    {
        rgInput.Add(kv.Key, kv.Value);
    }

    m_rgLayers.Add("input", rgInput);

    rgstrUsedLayers.Sort();

    return rgstrUsedLayers;
}
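To make the bookkeeping concrete, the m_rgLayers dictionary built from the VGG defaults shown earlier would contain (illustrative):

    // "content": { "conv4_2": 1 }
    // "style":   { "conv1_1": 0.2, "conv2_1": 0.2, "conv3_1": 0.2, "conv4_1": 0.2, "conv5_1": 0.2 }
    // "gram":    { "gram_conv1_1": 0.2, ... , "gram_conv5_1": 0.2 }
    // "input":   the union of the "content" and "gram" entries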
private void prune(NetParameter p, List<string> rgUsedLayers)
{
    // ...
    for (int i = 0; i < p.layer.Count; i++)
    {
        for (int j = 0; j < p.layer[i].top.Count; j++)
        {
            bool bIsUsed = rgUsedLayers.Contains(p.layer[i].top[j]);
            // ...
            if (nPruneFrom >= 0 && bIsUsed)
                // ...
            else if (nPruneFrom < 0 && !bIsUsed)
                // ...
        }
    }
    // ...
    for (int i = p.layer.Count - 1; i >= nPruneFrom; i--)
        // ...
    List<KeyValuePair<string, double>> lstStyle = m_rgLayers["style"].ToList();
    List<KeyValuePair<string, double>> lstGram = m_rgLayers["gram"].ToList();

    for (int i = 0; i < lstStyle.Count; i++)
    {
        bool bUseHalfSize = false;
        string strStyle = lstStyle[i].Key;
        string strGram = lstGram[i].Key;
        // ...
        if (layer1.top.Contains(strStyle))
            // ...

        layer.name = strGram;
        layer.bottom.Add(strStyle);
        layer.top.Add(strGram);
        // ...
        layer.use_halfsize = (bUseHalfSize && m_bAllowHalfSizeOnGram);
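For context: a gram layer computes the Gram matrix of the style representation from Gatys et al., where F is the layer's feature map flattened to C x (H*W),

    G_{ij} = \alpha \sum_k F_{ik} F_{jk}

with the GramParameter's alpha applied before the product and beta after it; the use_halfsize assignment above only controls the precision used for that computation.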
private double get_style_scale(Blob<T> b)
{
    double df1 = b.shape(0);
    df1 = Math.Pow(df1, -2);
    double df2 = b.count(1);
    df2 = Math.Pow(df2, -2);
    // ...
    double dfC = (df1 * df2);
    // ...
}

private double get_content_scale(Blob<T> b)
{
    return m_dfContentLossScale;
}
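Reading get_style_scale: with N = b.shape(0) and M = b.count(1), the returned value is proportional to N^{-2} M^{-2}, which mirrors the normalization of the per-layer style loss in Gatys et al.,

    E_l = \frac{1}{4 N_l^2 M_l^2} \sum_{ij} (G_{ij} - A_{ij})^2

with any remaining constant factors presumably folded into the elided lines.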
private void prepare_data_blob(Net<T> net, Bitmap bmp)
{
    List<int> rgDataShape = new List<int>() { 1, 3, bmp.Height, bmp.Width };
    m_transformer = new DataTransformer<T>(m_cuda, m_log, m_transformationParam,
                                           Phase.TEST, 3, bmp.Height, bmp.Width);
    // ...
}

private void prepare_input_param(Net<T> net, Bitmap bmp)
{
    List<int> rgDataShape = new List<int>() { 1, 3, bmp.Height, bmp.Width };
    m_transformer = new DataTransformer<T>(m_cuda, m_log, m_transformationParam,
                                           Phase.TEST, 3, bmp.Height, bmp.Width);
    // ...
}
private Bitmap save(Net<T> net)
{
    // ...
}

public Bitmap Process(Bitmap bmpStyle, Bitmap bmpContent, int nIterations,
                      int nIntermediateOutput = -1, double dfTvLoss = 0, int nMaxSize = -1,
                      bool bEnablePartialSolution = false)
    m_dfTVLossWeight = dfTvLoss;
    m_nIterations = nIterations;
    // ...
    nMaxSize = m_nDefaultMaxImageSize;

    // Downscale the content image to the maximum size, preserving aspect ratio.
    if (bmpContent.Width > nMaxSize || bmpContent.Height > nMaxSize)
    {
        double dfAspectRatio = (double)bmpContent.Height / (double)bmpContent.Width;
        int nWidth = nMaxSize;
        int nHeight = (int)(nMaxSize * dfAspectRatio);
        // ...
    }

    // The style image must match the content image's dimensions.
    if (bmpStyle.Width != bmpContent.Width || bmpStyle.Height != bmpContent.Height)
        // ...

    m_log.WriteLine("Creating input network...");
    net = new Net<T>(m_cuda, m_log, m_param, m_evtCancel, null, Phase.TEST, null,
                     m_netShare, net_OnGetWorkspace, net_OnSetWorkspace);

    if (m_rgWeights != null && !m_bUsingSharedNet)
        // ...
    // Run the style image through the net and cache each gram activation.
    prepare_data_blob(net, bmpStyle);
    // ...
    foreach (KeyValuePair<string, double> kvGram in m_rgLayers["gram"])
    {
        string strGram = kvGram.Key;
        // ...
        colGramActivations.Add(blobGram.Clone());
    }

    // Run the content image through the net and cache each content activation.
    prepare_data_blob(net, bmpContent);
    // ...
    foreach (KeyValuePair<string, double> kvContent in m_rgLayers["content"])
    {
        string strContent = kvContent.Key;
        // ...
        colContentActivations.Add(blobContent.Clone());
    }
    // Add an input layer for each cached activation.
    foreach (KeyValuePair<string, double> kvInput in m_rgLayers["input"])
    {
        string strName = kvInput.Key;
        // ...
        p.name = "input_" + strName;
        // ...
        net_param.layer.Add(p);
    }
    // Wire up a scale -> event -> loss chain for each content layer.
    foreach (KeyValuePair<string, double> kvContent in m_rgLayers["content"])
    {
        string strName = kvContent.Key;
        string strScale1 = "input_" + strName;
        string strScale2 = strName;
        Blob<T> blobContent = colContentActivations[strName];

        if (m_dfContentDataScale != 1.0)
        {
            // ...
            ps1.bottom.Add("input_" + strName);
            ps1.top.Add(strScale1);
            // ...
            net_param.layer.Add(ps1);
            // ...
            ps2.top.Add(strScale2);
            // ...
            net_param.layer.Add(ps2);
        }

        // ...
        event_param.name = "event_" + strName;
        event_param.bottom.Add(strScale2);
        event_param.bottom.Add(strScale1);
        event_param.top.Add("event_" + strName);
        // ...
        net_param.layer.Add(event_param);

        // ...
        p.name = "loss_" + strName;
        double dfScale = get_content_scale(blobContent);
        // ...
        p.bottom.Add("event_" + strName);
        p.top.Add("loss_" + strName);
        // ...
        net_param.layer.Add(p);
    }
    // Wire up an event -> loss chain for each gram (style) layer.
    foreach (KeyValuePair<string, double> kvGram in m_rgLayers["gram"].ToList())
    {
        string strGramName = kvGram.Key;
        Blob<T> blobGram = colGramActivations[strGramName];

        // ...
        event_param.name = "event_" + strGramName;
        event_param.bottom.Add(strGramName);
        event_param.bottom.Add("input_" + strGramName);
        event_param.top.Add("event_" + strGramName);
        // ...
        net_param.layer.Add(event_param);

        // ...
        p.name = "loss_" + strGramName;
        double dfScale = get_style_scale(blobGram);
        // ...
        p.bottom.Add("input_" + strGramName);
        p.bottom.Add("event_" + strGramName);
        p.top.Add("loss_" + strGramName);
        // ...
        net_param.layer.Add(p);
    }
    // Optionally add a total-variation smoothing loss on the data blob.
    if (m_dfTVLossWeight != 0)
    {
        // ...
        double dfWeight = m_dfTVLossWeight;
        // ...
        p.bottom.Add(m_strDataBlobName);
        p.top.Add("loss_tv");
        // ...
        net_param.layer.Add(p);
    }
    // Find the 'input1' layer and set its shape from the data blob.
    for (int i = 0; i < net_param.layer.Count; i++)
    {
        // ...
        if (p.name == "input1")
        {
            // ...
            net_param.layer[i].parameter_param.shape = new BlobShape(data.shape());
        }
    }
    // ...
    if (rgTypes.Contains(layer.type))
        // ...
    solver_param.display = m_nDisplayEvery;
    // ...
    solver_param.base_lr = m_dfLearningRate;
    solver_param.type = m_solverType;
    // ...
    m_log.WriteLine("Creating " + m_solverType.ToString() + " solver with learning rate = " +
                    m_dfLearningRate.ToString() + "...");
    // ...
    solver = new LBFGSSolver<T>(m_cuda, m_log, solver_param, m_evtCancel, null, null, null,
                                m_persist, 1, 0, m_netShare, net_OnGetWorkspace, net_OnSetWorkspace);
    // ...
    solver = Solver<T>.Create(m_cuda, m_log, solver_param, m_evtCancel, null, null, null,
                              m_persist, 1, 0, m_netShare, net_OnGetWorkspace, net_OnSetWorkspace);
    eventLayer.OnBackward += EventLayer_OnBackward;
    // ...
    prepare_input_param(solver.net, bmpContent);

    // Copy the cached content activations into their input blobs.
    foreach (KeyValuePair<string, double> kvContent in m_rgLayers["content"])
    {
        string strName = kvContent.Key;
        Blob<T> blobDst = solver.net.blob_by_name("input_" + strName);
        Blob<T> blobSrc = colContentActivations[strName];
        // ...
    }

    // Copy the cached gram activations into their input blobs.
    foreach (KeyValuePair<string, double> kvGram in m_rgLayers["gram"])
    {
        string strName = kvGram.Key;
        Blob<T> blobDst = solver.net.blob_by_name("input_" + strName);
        Blob<T> blobSrc = colGramActivations[strName];
        // ...
    }

    // ... (the cached activations are no longer needed once copied)
    colGramActivations = null;
    // ...
    colContentActivations.Dispose();
    colContentActivations = null;
    // Disable the partial solution when no intermediate output is requested.
    if (nIntermediateOutput <= 0 || nIntermediateOutput == m_nIterations)
    {
        bEnablePartialSolution = false;
        nIntermediateOutput = m_nIterations;
    }

    int nIterations1 = m_nIterations / nIntermediateOutput;

    // Load the pre-trained weights, keeping the learnable input blob in place.
    if (m_rgWeights != null && !m_bUsingSharedNet)
    {
        Blob<T> blobInput = solver.net.learnable_parameters[0];
        solver.net.learnable_parameters.RemoveAt(0);
        solver.net.LoadWeights(m_rgWeights, m_persist);
        solver.net.learnable_parameters.Insert(0, blobInput);
    }

    if (bEnablePartialSolution)
    {
        // ...
        m_nPartialIteration = 0;
        m_nPartialIterations1 = nIterations1;
        m_nIntermediateOutput = nIntermediateOutput;
        // ...
    }
    for (int i = 0; i < nIterations1; i++)
    {
        // ...
        solver.Step(nIntermediateOutput, TRAIN_STEP.NONE, true, true, true);
        // ...
        Bitmap bmpTemp = save(solver.net);
        double dfPct = (double)i / (double)nIterations1;
        // ...
    }

    return save(solver.net);
catch (Exception excpt)
{
    // ...
}
// ...
if (colGramActivations != null)
    // ...

if (colContentActivations != null)
    colContentActivations.Dispose();
private void net_OnSetWorkspace(object sender, WorkspaceArgs e)
{
    // ...
    m_cuda.DisableGhostMemory();

    if (m_hWorkspaceData != 0)
        m_cuda.FreeMemory(m_hWorkspaceData);

    m_hWorkspaceData = m_cuda.AllocMemory((long)m_lWorkspaceSizeInBytes);
    m_cuda.ResetGhostMemory();
    // ...
}

private void net_OnGetWorkspace(object sender, WorkspaceArgs e)
{
    // ...
}
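The getter body is elided in this listing; a minimal handler consistent with the setter above would simply hand the cached allocation back to the requesting layer (a sketch, not the verbatim implementation):

    private void net_OnGetWorkspace(object sender, WorkspaceArgs e)
    {
        // Return the shared workspace handle and its current size.
        e.WorkspaceData = m_hWorkspaceData;
        e.WorkspaceSizeInBytes = m_lWorkspaceSizeInBytes;
    }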
public Bitmap ProcessNext(out Bitmap bmpIntermediate, out int nIntermediateIdx)
{
    bmpIntermediate = null;
    nIntermediateIdx = m_nPartialIteration * m_nIntermediateOutput;

    if (m_solver == null)
        throw new Exception("To run the next in process, the solver cannot be null! You must call Process first.");

    m_solver.Step(m_nIntermediateOutput, TRAIN_STEP.NONE, true, true, true);
    // ...
    m_nPartialIteration++;

    // Hand back an intermediate rendering while iterations remain.
    if (m_nIntermediateOutput > 0 && m_nPartialIteration < m_nPartialIterations1)
    {
        bmpIntermediate = save(m_solver.net);
        // ...
        double dfPct = (double)m_nPartialIteration / (double)m_nPartialIterations1;
        // ...
    }

    if (m_nPartialIteration < m_nPartialIterations1)
        // ...

    return save(m_solver.net);
    // ...
    catch (Exception excpt)
    {
        // ...
    }
    // ...
    if (m_nPartialIteration == m_nPartialIterations1)
    {
        if (m_solver != null)
            // ...
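Putting Process and ProcessNext together, a partial-solution loop might look like this (a sketch using nst, bmpStyle and bmpContent from the earlier examples; it assumes, per the bookkeeping above, that Process returns null once a partial solution is started and that ProcessNext returns the final image on its last call):

    Bitmap bmpResult = nst.Process(bmpStyle, bmpContent, 1000,
                                   100,    // nIntermediateOutput: render every 100 iterations
                                   0,      // dfTvLoss: no TV smoothing
                                   -1,     // nMaxSize: use the default (840)
                                   true);  // bEnablePartialSolution

    while (bmpResult == null)
    {
        Bitmap bmpIntermediate;
        int nIdx;
        bmpResult = nst.ProcessNext(out bmpIntermediate, out nIdx);

        if (bmpIntermediate != null)
            bmpIntermediate.Save("intermediate_" + nIdx + ".png");  // hypothetical output path
    }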
    long hTopDiff0 = e.TopVec[0].mutable_gpu_diff;
    long hBottomData1 = e.BottomVec[1].gpu_data;
    long hBottomDiff1 = e.BottomVec[1].mutable_gpu_diff;
    long hBottomDiff = e.BottomVec[0].mutable_gpu_diff;

    m_cuda.sign(nCount, hBottomData1, hBottomDiff1);           // sign(x): -1, 0 or +1
    m_cuda.abs(nCount, hBottomDiff1, hBottomDiff1);            // |sign(x)|: 0/1 mask
    m_cuda.mul(nCount, hBottomDiff1, hTopDiff0, hBottomDiff);  // gate the top diff
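Read elementwise, the three kernel calls implement a gradient gate: the incoming diff passes through only where the second bottom blob is non-zero (a CPU sketch of the same computation; the rg* arrays are hypothetical host-side copies of the GPU buffers):

    // bottomDiff[i] = |sign(bottomData1[i])| * topDiff0[i]
    for (int i = 0; i < nCount; i++)
    {
        float fMask = (rgBottomData1[i] != 0) ? 1.0f : 0.0f;  // |sign(x)|
        rgBottomDiff[i] = fMask * rgTopDiff0[i];
    }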
    // ...
    if (double.IsNaN(e.Loss))
        m_log.FAIL("Loss = NAN!");

    if (double.IsInfinity(e.Loss))
        m_log.FAIL("Loss = Infinity!");
private void Solver_OnSnapshot(object sender, SnapshotArgs e)
{
    // ...
public static string CreateConfigurationString(string strSolver, double dfLearningRate,
                                               int nMaxImageSize, int nIterations, int nIntermediateIterations,
                                               Dictionary<string, Tuple<double, double>> rgWts, List<int> rgGpuID,
                                               int nLBFGSCorrections, double dfDataScale,
                                               bool bAllowHs, bool bAllowHsGram, bool bAllowHsEvent,
                                               bool bAllowHsScalar, bool bAllowHsLoss)
{
    // ...
    rgChildren.Add("solver", strSolver);
    rgChildren.Add("learning_rate", dfLearningRate);
    rgChildren.Add("max_image_size", nMaxImageSize);
    rgChildren.Add("iterations", nIterations);
    rgChildren.Add("intermediate_iterations", nIntermediateIterations);

    // Emit one 'layer' node per (style_wt, content_wt) entry.
    foreach (KeyValuePair<string, Tuple<double, double>> kv in rgWts)
    {
        // ...
        layer.Add("name", kv.Key);
        layer.Add("style_wt", kv.Value.Item1);
        layer.Add("content_wt", kv.Value.Item2);
        // ...
        rgLayerWt.Add(new RawProto("layer", "", layer));
    }

    rgChildren.Add(rgLayerWt);

    // ...
    foreach (int nGpuID in rgGpuID)
    {
        gpus.Add("gpuid", nGpuID.ToString());
    }

    rgChildren.Add(gpus);
    rgChildren.Add("lbfgs_corrections", nLBFGSCorrections);
    rgChildren.Add("data_scale", dfDataScale);
    rgChildren.Add("allow_hs", bAllowHs);
    rgChildren.Add("allow_hs_gram", bAllowHsGram);
    rgChildren.Add("allow_hs_event", bAllowHsEvent);
    rgChildren.Add("allow_hs_scalar", bAllowHsScalar);
    rgChildren.Add("allow_hs_loss", bAllowHsLoss);
    // ...
public static Dictionary<string, Tuple<double, double>> ParseConfigurationString(
    string strConfig, out string strSolver, out double dfLearningRate, out int nMaxImageSize,
    out int nIterations, out int nIntermediateIterations, out List<int> rgGpuID,
    out int nLBFGSCorrections, out double dfDataScale, out bool bAllowHs, out bool bAllowHsGram,
    out bool bAllowHsEvent, out bool bAllowHsScalar, out bool bAllowHsLoss)
{
    // ...
    if ((strVal = proto.FindValue("solver")) != null)
        // ...

    if ((strVal = proto.FindValue("learning_rate")) != null)
        // ...

    if ((strVal = proto.FindValue("max_image_size")) != null)
        nMaxImageSize = int.Parse(strVal);

    // ...
    if ((strVal = proto.FindValue("iterations")) != null)
        nIterations = int.Parse(strVal);

    nIntermediateIterations = 0;
    if ((strVal = proto.FindValue("intermediate_iterations")) != null)
        nIntermediateIterations = int.Parse(strVal);

    Dictionary<string, Tuple<double, double>> rgLayers = new Dictionary<string, Tuple<double, double>>();
    // ...
    foreach (RawProto styleProto in style)
    {
        string strLayer = null;
        if ((strVal = styleProto.FindValue("name")) != null)
            // ...

        if ((strVal = styleProto.FindValue("style_wt")) != null)
            // ...

        if ((strVal = styleProto.FindValue("content_wt")) != null)
            // ...

        rgLayers.Add(strLayer, new Tuple<double, double>(dfSWt, dfCWt));
    }

    rgGpuID = new List<int>();
    // ...
    foreach (RawProto gpuProto in gpus)
    {
        rgGpuID.Add(int.Parse(gpuProto.Value));
    }

    nLBFGSCorrections = 100;
    if ((strVal = proto.FindValue("lbfgs_corrections")) != null)
        nLBFGSCorrections = int.Parse(strVal);

    // ...
    if ((strVal = proto.FindValue("data_scale")) != null)
        // ...

    // ...
    if ((strVal = proto.FindValue("allow_hs")) != null)
        bAllowHs = bool.Parse(strVal);

    bAllowHsGram = true;
    if ((strVal = proto.FindValue("allow_hs_gram")) != null)
        bAllowHsGram = bool.Parse(strVal);

    bAllowHsEvent = true;
    if ((strVal = proto.FindValue("allow_hs_event")) != null)
        bAllowHsEvent = bool.Parse(strVal);

    bAllowHsScalar = true;
    if ((strVal = proto.FindValue("allow_hs_scalar")) != null)
        bAllowHsScalar = bool.Parse(strVal);

    bAllowHsLoss = true;
    if ((strVal = proto.FindValue("allow_hs_loss")) != null)
        bAllowHsLoss = bool.Parse(strVal);
    // ...
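The two static helpers round-trip through the RawProto format; a usage sketch (hypothetical weight values):

    Dictionary<string, Tuple<double, double>> rgWts = new Dictionary<string, Tuple<double, double>>();
    rgWts.Add("conv4_2", new Tuple<double, double>(0.0, 1.0));  // content-only layer
    rgWts.Add("conv1_1", new Tuple<double, double>(0.2, 0.0));  // style-only layer

    string strCfg = NeuralStyleTransfer<float>.CreateConfigurationString(
        "LBFGS", 1.5, 840, 1000, 100, rgWts, new List<int>() { 0 },
        100, 1.0, true, true, true, true, true);

    string strSolver;
    double dfLr, dfScale;
    int nMaxSize, nIters, nInterIters, nCorrections;
    List<int> rgGpuID;
    bool bHs, bHsGram, bHsEvent, bHsScalar, bHsLoss;

    Dictionary<string, Tuple<double, double>> rgParsed =
        NeuralStyleTransfer<float>.ParseConfigurationString(strCfg,
            out strSolver, out dfLr, out nMaxSize, out nIters, out nInterIters,
            out rgGpuID, out nCorrections, out dfScale,
            out bHs, out bHsGram, out bHsEvent, out bHsScalar, out bHsLoss);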
    m_nIteration = nIteration;
    // ...
    m_dfPercent = dfPct;
    // ...
    get { return m_nIteration; }
    // ...
    get { return m_img; }
    // ...
    get { return m_dfPercent; }