From 652472ce805505c29f3eec9753c7ef83a79f02bc Mon Sep 17 00:00:00 2001
From: Senja Filipi <sefilipi@microsoft.com>
Date: Thu, 27 Sep 2018 13:56:53 -0700
Subject: [PATCH 01/10] AP extensions

---
 .../Standard/LinearClassificationTrainer.cs   |   2 +-
 .../Standard/Online/AveragedLinear.cs         |  13 +-
 .../Standard/Online/AveragedPerceptron.cs     |  18 +-
 .../Standard/Online/LinearSvm.cs              |  17 +-
 .../Standard/Online/OnlineLearnerStatic.cs    | 205 ++++++++++++++++++
 .../Standard/Online/OnlineLinear.cs           |   7 +-
 .../Standard/SdcaStatic.cs                    |   4 +-
 .../Training.cs                               |  85 +++++++-
 8 files changed, 322 insertions(+), 29 deletions(-)
 create mode 100644 src/Microsoft.ML.StandardLearners/Standard/Online/OnlineLearnerStatic.cs
diff --git a/src/Microsoft.ML.StandardLearners/Standard/LinearClassificationTrainer.cs b/src/Microsoft.ML.StandardLearners/Standard/LinearClassificationTrainer.cs
index 8722b79ea6..29e2e1e89f 100644
--- a/src/Microsoft.ML.StandardLearners/Standard/LinearClassificationTrainer.cs
+++ b/src/Microsoft.ML.StandardLearners/Standard/LinearClassificationTrainer.cs
@@ -1359,7 +1359,7 @@ public void Add(Double summand)
     public sealed class LinearClassificationTrainer : SdcaTrainerBase<BinaryPredictionTransformer<TScalarPredictor>, TScalarPredictor>
     {
         public const string LoadNameValue = "SDCA";
-        public const string UserNameValue = "Fast Linear (SA-SDCA)";
+        internal const string UserNameValue = "Fast Linear (SA-SDCA)";
 
         public sealed class Arguments : ArgumentsBase
         {
diff --git a/src/Microsoft.ML.StandardLearners/Standard/Online/AveragedLinear.cs b/src/Microsoft.ML.StandardLearners/Standard/Online/AveragedLinear.cs
index 70ee279a1c..c2656bd6f5 100644
--- a/src/Microsoft.ML.StandardLearners/Standard/Online/AveragedLinear.cs
+++ b/src/Microsoft.ML.StandardLearners/Standard/Online/AveragedLinear.cs
@@ -22,12 +22,12 @@ public abstract class AveragedLinearArguments : OnlineLinearArguments
         [Argument(ArgumentType.AtMostOnce, HelpText = "Learning rate", ShortName = "lr", SortOrder = 50)]
         [TGUI(Label = "Learning rate", SuggestedSweeps = "0.01,0.1,0.5,1.0")]
         [TlcModule.SweepableDiscreteParam("LearningRate", new object[] { 0.01, 0.1, 0.5, 1.0 })]
-        public Float LearningRate = 1;
+        public Float LearningRate = DefaultAveragedArgs.LearningRate;
 
         [Argument(ArgumentType.AtMostOnce, HelpText = "Decrease learning rate", ShortName = "decreaselr", SortOrder = 50)]
         [TGUI(Label = "Decrease Learning Rate", Description = "Decrease learning rate as iterations progress")]
         [TlcModule.SweepableDiscreteParam("DecreaseLearningRate", new object[] { false, true })]
-        public bool DecreaseLearningRate = false;
+        public bool DecreaseLearningRate = DefaultAveragedArgs.DecreaseLearningRate;
 
         [Argument(ArgumentType.AtMostOnce, HelpText = "Number of examples after which weights will be reset to the current average", ShortName = "numreset")]
         public long? ResetWeightsAfterXExamples = null;
@@ -38,7 +38,7 @@ public abstract class AveragedLinearArguments : OnlineLinearArguments
         [Argument(ArgumentType.AtMostOnce, HelpText = "L2 Regularization Weight", ShortName = "reg", SortOrder = 50)]
         [TGUI(Label = "L2 Regularization Weight")]
         [TlcModule.SweepableFloatParam("L2RegularizerWeight", 0.0f, 0.4f)]
-        public Float L2RegularizerWeight = 0;
+        public Float L2RegularizerWeight = DefaultAveragedArgs.L2RegularizerWeight;
 
         [Argument(ArgumentType.AtMostOnce, HelpText = "Extra weight given to more recent updates", ShortName = "rg")]
         public Float RecencyGain = 0;
@@ -51,6 +51,13 @@ public abstract class AveragedLinearArguments : OnlineLinearArguments
 
         [Argument(ArgumentType.AtMostOnce, HelpText = "The inexactness tolerance for averaging", ShortName = "avgtol")]
         public Float AveragedTolerance = (Float)1e-2;
+
+        internal static class DefaultAveragedArgs // Defaults shared by the LearningRate, DecreaseLearningRate and L2RegularizerWeight fields above.
+        {
+            internal const Float LearningRate = 1;
+            internal const bool DecreaseLearningRate = false;
+            internal const Float L2RegularizerWeight = 0;
+        }
     }
 
     public abstract class AveragedLinearTrainer<TTransformer, TModel> : OnlineLinearTrainer<TTransformer, TModel>
diff --git a/src/Microsoft.ML.StandardLearners/Standard/Online/AveragedPerceptron.cs b/src/Microsoft.ML.StandardLearners/Standard/Online/AveragedPerceptron.cs
index f5a1dc44f5..4862caa4d6 100644
--- a/src/Microsoft.ML.StandardLearners/Standard/Online/AveragedPerceptron.cs
+++ b/src/Microsoft.ML.StandardLearners/Standard/Online/AveragedPerceptron.cs
@@ -57,23 +57,23 @@ public AveragedPerceptronTrainer(IHostEnvironment env, Arguments args)
         {
             _args = args;
             LossFunction = _args.LossFunction.CreateComponent(env);
+        }
+
+        public override PredictionKind PredictionKind => PredictionKind.BinaryClassification;
 
-            _outputColumns = new[]
+        protected override bool NeedCalibration => true;
+
+        protected override SchemaShape.Column[] GetOutputColumnsCore(SchemaShape inputSchema)
+        {
+            return new[]
             {
                 new SchemaShape.Column(DefaultColumnNames.Score, SchemaShape.Column.VectorKind.Scalar, NumberType.R4, false, new SchemaShape(MetadataUtils.GetTrainerOutputMetadata())),
+                // REVIEW: should the Probability column be declared here, given that NeedCalibration is true?
                 new SchemaShape.Column(DefaultColumnNames.Probability, SchemaShape.Column.VectorKind.Scalar, NumberType.R4, false, new SchemaShape(MetadataUtils.GetTrainerOutputMetadata(true))),
                 new SchemaShape.Column(DefaultColumnNames.PredictedLabel, SchemaShape.Column.VectorKind.Scalar, BoolType.Instance, false, new SchemaShape(MetadataUtils.GetTrainerOutputMetadata()))
             };
         }
 
-        public override PredictionKind PredictionKind => PredictionKind.BinaryClassification;
-
-        protected override bool NeedCalibration => true;
-
-        private readonly SchemaShape.Column[] _outputColumns;
-
-        protected override SchemaShape.Column[] GetOutputColumnsCore(SchemaShape inputSchema) => _outputColumns;
-
         protected override void CheckLabel(RoleMappedData data)
         {
             Contracts.AssertValue(data);
diff --git a/src/Microsoft.ML.StandardLearners/Standard/Online/LinearSvm.cs b/src/Microsoft.ML.StandardLearners/Standard/Online/LinearSvm.cs
index ad8442433d..d312c6b52b 100644
--- a/src/Microsoft.ML.StandardLearners/Standard/Online/LinearSvm.cs
+++ b/src/Microsoft.ML.StandardLearners/Standard/Online/LinearSvm.cs
@@ -34,8 +34,8 @@ namespace Microsoft.ML.Runtime.Learners
     /// </summary>
     public sealed class LinearSvm : OnlineLinearTrainer<BinaryPredictionTransformer<LinearBinaryPredictor>, LinearBinaryPredictor>
     {
-        public const string LoadNameValue = "LinearSVM";
-        public const string ShortName = "svm";
+        internal const string LoadNameValue = "LinearSVM";
+        internal const string ShortName = "svm";
         internal const string UserNameValue = "SVM (Pegasos-Linear)";
         internal const string Summary = "The idea behind support vector machines, is to map the instances into a high dimensional space "
             + "in which instances of the two classes are linearly separable, i.e., there exists a hyperplane such that all the positive examples are on one side of it, "
@@ -92,8 +92,13 @@ public LinearSvm(IHostEnvironment env, Arguments args)
             Contracts.CheckUserArg(args.BatchSize > 0, nameof(args.BatchSize), UserErrorPositive);
 
             Args = args;
+        }
+
+        public override PredictionKind PredictionKind => PredictionKind.BinaryClassification;
 
-            _outputColumns = new[]
+        protected override SchemaShape.Column[] GetOutputColumnsCore(SchemaShape inputSchema)
+        {
+            return new[]
             {
                 new SchemaShape.Column(DefaultColumnNames.Score, SchemaShape.Column.VectorKind.Scalar, NumberType.R4, false),
                 new SchemaShape.Column(DefaultColumnNames.Probability, SchemaShape.Column.VectorKind.Scalar, NumberType.R4, false),
@@ -101,12 +106,6 @@ public LinearSvm(IHostEnvironment env, Arguments args)
             };
         }
 
-        public override PredictionKind PredictionKind => PredictionKind.BinaryClassification;
-
-        private readonly SchemaShape.Column[] _outputColumns;
-
-        protected override SchemaShape.Column[] GetOutputColumnsCore(SchemaShape inputSchema) => _outputColumns;
-
         protected override void CheckLabel(RoleMappedData data)
         {
             Contracts.AssertValue(data);
diff --git a/src/Microsoft.ML.StandardLearners/Standard/Online/OnlineLearnerStatic.cs b/src/Microsoft.ML.StandardLearners/Standard/Online/OnlineLearnerStatic.cs
new file mode 100644
index 0000000000..afa2790821
--- /dev/null
+++ b/src/Microsoft.ML.StandardLearners/Standard/Online/OnlineLearnerStatic.cs
@@ -0,0 +1,205 @@
+﻿// Licensed to the .NET Foundation under one or more agreements.
+// The .NET Foundation licenses this file to you under the MIT license.
+// See the LICENSE file in the project root for more information.
+
+using Microsoft.ML.Runtime;
+using Microsoft.ML.Runtime.Data;
+using Microsoft.ML.Runtime.Internal.Calibration;
+using Microsoft.ML.Runtime.Learners;
+using Microsoft.ML.StaticPipe;
+using Microsoft.ML.StaticPipe.Runtime;
+using System;
+
+namespace Microsoft.ML.Trainers
+{
+    public static class OnlineLearnerStatic
+    {
+        /// <summary>
+        /// Predict a target using a linear binary classification model trained with the AveragedPerceptron trainer, and a custom loss.
+        /// Note that because we cannot be sure that all loss functions will produce naturally calibrated outputs, setting
+        /// a custom loss function will not produce a calibrated probability column.
+        /// </summary>
+        /// <param name="ctx">The binary classification context trainer object.</param>
+        /// <param name="lossFunction">The custom loss. Must not be null.</param>
+        /// <param name="label">The label, or dependent variable.</param>
+        /// <param name="features">The features, or independent variables.</param>
+        /// <param name="weights">The optional example weights.</param>
+        /// <param name="learningRate">The learning rate. Must be positive.</param>
+        /// <param name="decreaseLearningRate">Decrease learning rate as iterations progress.</param>
+        /// <param name="l2RegularizerWeight">L2 regularization weight. Must be in the range [0, 0.5).</param>
+        /// <param name="numIterations">Number of training iterations through the data. Must be positive.</param>
+        /// <param name="onFit">A delegate that is called every time the
+        /// <see cref="Estimator{TTupleInShape, TTupleOutShape, TTransformer}.Fit(DataView{TTupleInShape})"/> method is called on the
+        /// <see cref="Estimator{TTupleInShape, TTupleOutShape, TTransformer}"/> instance created out of this. This delegate will receive
+        /// the linear model that was trained (no calibrator is passed). Note that this action cannot change the
+        /// result in any way; it is only a way for the caller to be informed about what was learnt.</param>
+        /// <returns>The set of output columns including in order the predicted binary classification score (which will range
+        /// from negative to positive infinity), and the predicted label.</returns>
+        /// <seealso cref="AveragedPerceptronTrainer"/>
+        public static (Scalar<float> score, Scalar<bool> predictedLabel) AveragedPerceptron(
+                this BinaryClassificationContext.BinaryClassificationTrainers ctx,
+                IClassificationLoss lossFunction,
+                Scalar<bool> label, Vector<float> features, Scalar<float> weights = null,
+                float learningRate = AveragedLinearArguments.DefaultAveragedArgs.LearningRate,
+                bool decreaseLearningRate = AveragedLinearArguments.DefaultAveragedArgs.DecreaseLearningRate,
+                float l2RegularizerWeight = AveragedLinearArguments.DefaultAveragedArgs.L2RegularizerWeight,
+                int numIterations = OnlineLinearArguments.DefaultArgs.NumIterations,
+                Action<LinearBinaryPredictor> onFit = null
+            )
+        {
+            Contracts.CheckValue(label, nameof(label));
+            Contracts.CheckValue(features, nameof(features));
+            Contracts.CheckValue(lossFunction, nameof(lossFunction));
+            Contracts.CheckValueOrNull(weights);
+            Contracts.CheckParam(learningRate > 0, nameof(learningRate), "Must be positive.");
+            Contracts.CheckParam(0 <= l2RegularizerWeight && l2RegularizerWeight < 0.5, nameof(l2RegularizerWeight), "must be in range [0, 0.5)");
+            // A single pass must be accepted: it is the declared default (OnlineLinearArguments.DefaultArgs.NumIterations).
+            Contracts.CheckParam(numIterations > 0, nameof(numIterations), "Must be positive, if specified.");
+            Contracts.CheckValueOrNull(onFit);
+
+            bool hasProbs = lossFunction is HingeLoss;
+
+            var args = new AveragedPerceptronTrainer.Arguments()
+            {
+                LearningRate = learningRate,
+                DecreaseLearningRate = decreaseLearningRate,
+                L2RegularizerWeight = l2RegularizerWeight,
+                NumIterations = numIterations
+            };
+
+            // lossFunction was verified to be non-null above, so the factory is always installed.
+            args.LossFunction = new TrivialClassificationLossFactory(lossFunction);
+
+            var rec = new TrainerEstimatorReconciler.BinaryClassifierNoCalibration(
+                (env, labelName, featuresName, weightsName) =>
+                {
+                    args.FeatureColumn = featuresName;
+                    args.LabelColumn = labelName;
+                    // NOTE(review): weightsName appears to be a column name, but InitialWeights is described as "Initial Weights and bias, comma-separated" - confirm.
+                    args.InitialWeights = weightsName;
+                    var trainer = new AveragedPerceptronTrainer(env, args);
+
+                    if (onFit != null)
+                        return trainer.WithOnFitDelegate(trans => onFit(trans.Model));
+                    else
+                        return trainer;
+
+                    /*
+                    if (onFit != null)
+                    {
+                        return trainer.WithOnFitDelegate(trans =>
+                        {
+                            var model = trans.Model;
+                            if (model is ParameterMixingCalibratedPredictor cali)
+                                onFit((LinearBinaryPredictor)cali.SubPredictor);
+                            else
+                                onFit((LinearBinaryPredictor)model);
+                        });
+                    }
+                    return trainer;
+                    */
+
+                }, label, features, weights, hasProbs);
+
+            return rec.Output;
+        }
+
+        /// <summary>
+        /// Predict a target using a linear binary classification model trained with the AveragedPerceptron trainer.
+        /// The loss is optional: when <paramref name="lossFunction"/> is null, the loss already set on the trainer arguments is kept.
+        /// Unlike the overload that takes the loss as its first argument, this one also returns a probability column.
+        /// </summary>
+        /// <param name="ctx">The binary classification context trainer object.</param>
+        /// <param name="label">The label, or dependent variable.</param>
+        /// <param name="features">The features, or independent variables.</param>
+        /// <param name="lossFunction">The optional custom loss.</param>
+        /// <param name="weights">The optional example weights.</param>
+        /// <param name="learningRate">The learning rate. Must be positive.</param>
+        /// <param name="decreaseLearningRate">Decrease learning rate as iterations progress.</param>
+        /// <param name="l2RegularizerWeight">L2 regularization weight. Must be in the range [0, 0.5).</param>
+        /// <param name="numIterations">Number of training iterations through the data. Must be positive.</param>
+        /// <param name="onFit">A delegate that is called every time the
+        /// <see cref="Estimator{TTupleInShape, TTupleOutShape, TTransformer}.Fit(DataView{TTupleInShape})"/> method is called on the
+        /// <see cref="Estimator{TTupleInShape, TTupleOutShape, TTransformer}"/> instance created out of this. This delegate will receive
+        /// the linear model that was trained (no calibrator is passed). Note that this action cannot change the
+        /// result in any way; it is only a way for the caller to be informed about what was learnt.</param>
+        /// <returns>The set of output columns including in order the predicted binary classification score (which will range
+        /// from negative to positive infinity), the predicted probability,
+        /// and the predicted label.</returns>
+        /// <seealso cref="AveragedPerceptronTrainer"/>
+        public static (Scalar<float> score, Scalar<float> probability, Scalar<bool> predictedLabel)
+            AveragedPerceptron(this BinaryClassificationContext.BinaryClassificationTrainers ctx,
+                Scalar<bool> label,
+                Vector<float> features,
+                IClassificationLoss lossFunction = null,
+                Scalar<float> weights = null,
+                float learningRate = AveragedLinearArguments.DefaultAveragedArgs.LearningRate,
+                bool decreaseLearningRate = AveragedLinearArguments.DefaultAveragedArgs.DecreaseLearningRate,
+                float l2RegularizerWeight = AveragedLinearArguments.DefaultAveragedArgs.L2RegularizerWeight,
+                int numIterations = OnlineLinearArguments.DefaultArgs.NumIterations,
+                Action<LinearBinaryPredictor> onFit = null)
+        {
+            Contracts.CheckValue(label, nameof(label));
+            Contracts.CheckValue(features, nameof(features));
+            Contracts.CheckValueOrNull(weights);
+            Contracts.CheckParam(learningRate > 0, nameof(learningRate), "Must be positive.");
+            Contracts.CheckParam(0 <= l2RegularizerWeight && l2RegularizerWeight < 0.5, nameof(l2RegularizerWeight), "must be in range [0, 0.5)");
+            // A single pass must be accepted: it is the declared default (OnlineLinearArguments.DefaultArgs.NumIterations).
+            Contracts.CheckParam(numIterations > 0, nameof(numIterations), "Must be positive, if specified.");
+            Contracts.CheckValueOrNull(onFit);
+
+            var args = new AveragedPerceptronTrainer.Arguments()
+            {
+                LearningRate = learningRate,
+                DecreaseLearningRate = decreaseLearningRate,
+                L2RegularizerWeight = l2RegularizerWeight,
+                NumIterations = numIterations
+            };
+
+            if (lossFunction != null)
+                args.LossFunction = new TrivialClassificationLossFactory(lossFunction);
+
+            var rec = new TrainerEstimatorReconciler.BinaryClassifier(
+                (env, labelName, featuresName, weightsName) =>
+                {
+                    args.FeatureColumn = featuresName;
+                    args.LabelColumn = labelName;
+                    // NOTE(review): weightsName appears to be a column name, but InitialWeights is described as "Initial Weights and bias, comma-separated" - confirm.
+                    args.InitialWeights = weightsName;
+                    var trainer = new AveragedPerceptronTrainer(env, args);
+                    if (onFit != null)
+                    {
+                        return trainer.WithOnFitDelegate(trans => onFit(trans.Model));
+                        /*
+                        return trainer.WithOnFitDelegate(trans =>
+                        {
+                            // Under the default log-loss we assume a calibrated predictor.
+                            var model = trans.Model;
+                            var cali = (ParameterMixingCalibratedPredictor)model;
+                            var pred = (LinearBinaryPredictor)cali.SubPredictor;
+                            onFit(pred, cali);
+                        });
+                        */
+                    }
+                    return trainer;
+                }, label, features, weights);
+
+            return rec.Output;
+        }
+
+        /// <summary>
+        /// Adapter that exposes an already-constructed <see cref="IClassificationLoss"/>
+        /// through <see cref="ISupportClassificationLossFactory"/>.
+        /// </summary>
+        private sealed class TrivialClassificationLossFactory : ISupportClassificationLossFactory
+        {
+            private readonly IClassificationLoss _wrapped;
+
+            /// <summary>Stores <paramref name="loss"/> as given; no validation is performed here.</summary>
+            public TrivialClassificationLossFactory(IClassificationLoss loss) => _wrapped = loss;
+
+            /// <summary>Hands back the wrapped loss as-is; <paramref name="env"/> is not consulted.</summary>
+            public IClassificationLoss CreateComponent(IHostEnvironment env) => _wrapped;
+        }
+    }
+}
diff --git a/src/Microsoft.ML.StandardLearners/Standard/Online/OnlineLinear.cs b/src/Microsoft.ML.StandardLearners/Standard/Online/OnlineLinear.cs
index 15bd5da290..fb28bfe23a 100644
--- a/src/Microsoft.ML.StandardLearners/Standard/Online/OnlineLinear.cs
+++ b/src/Microsoft.ML.StandardLearners/Standard/Online/OnlineLinear.cs
@@ -24,7 +24,7 @@ public abstract class OnlineLinearArguments : LearnerInputBaseWithLabel
         [Argument(ArgumentType.AtMostOnce, HelpText = "Number of iterations", ShortName = "iter", SortOrder = 50)]
         [TGUI(Label = "Number of Iterations", Description = "Number of training iterations through data", SuggestedSweeps = "1,10,100")]
         [TlcModule.SweepableLongParamAttribute("NumIterations", 1, 100, stepSize: 10, isLogScale: true)]
-        public int NumIterations = 1;
+        public int NumIterations = DefaultArgs.NumIterations;
 
         [Argument(ArgumentType.AtMostOnce, HelpText = "Initial Weights and bias, comma-separated", ShortName = "initweights")]
         [TGUI(NoSweep = true)]
@@ -41,6 +41,11 @@ public abstract class OnlineLinearArguments : LearnerInputBaseWithLabel
 
         [Argument(ArgumentType.AtMostOnce, HelpText = "Size of cache when trained in Scope", ShortName = "cache")]
         public int StreamingCacheSize = 1000000;
+
+        internal static class DefaultArgs // Default backing the NumIterations field above.
+        {
+            internal const int NumIterations = 1;
+        }
     }
 
     public abstract class OnlineLinearTrainer<TTransformer, TModel> : TrainerEstimatorBase<TTransformer, TModel>
diff --git a/src/Microsoft.ML.StandardLearners/Standard/SdcaStatic.cs b/src/Microsoft.ML.StandardLearners/Standard/SdcaStatic.cs
index 113092ed26..6c4995bfa7 100644
--- a/src/Microsoft.ML.StandardLearners/Standard/SdcaStatic.cs
+++ b/src/Microsoft.ML.StandardLearners/Standard/SdcaStatic.cs
@@ -142,7 +142,7 @@ public static (Scalar<float> score, Scalar<float> probability, Scalar<bool> pred
         /// <param name="ctx">The binary classification context trainer object.</param>
         /// <param name="label">The label, or dependent variable.</param>
         /// <param name="features">The features, or independent variables.</param>
-        /// /// <param name="loss">The custom loss.</param>
+        /// <param name="loss">The custom loss.</param>
         /// <param name="weights">The optional example weights.</param>
         /// <param name="l2Const">The L2 regularization hyperparameter.</param>
         /// <param name="l1Threshold">The L1 regularization hyperparameter. Higher values will tend to lead to more sparse model.</param>
@@ -212,7 +212,7 @@ public static (Scalar<float> score, Scalar<bool> predictedLabel) Sdca(
         /// <param name="ctx">The multiclass classification context trainer object.</param>
         /// <param name="label">The label, or dependent variable.</param>
         /// <param name="features">The features, or independent variables.</param>
-        /// /// <param name="loss">The custom loss.</param>
+        /// <param name="loss">The custom loss.</param>
         /// <param name="weights">The optional example weights.</param>
         /// <param name="l2Const">The L2 regularization hyperparameter.</param>
         /// <param name="l1Threshold">The L1 regularization hyperparameter. Higher values will tend to lead to more sparse model.</param>
diff --git a/test/Microsoft.ML.StaticPipelineTesting/Training.cs b/test/Microsoft.ML.StaticPipelineTesting/Training.cs
index bfd9bfa456..b7bf2606d4 100644
--- a/test/Microsoft.ML.StaticPipelineTesting/Training.cs
+++ b/test/Microsoft.ML.StaticPipelineTesting/Training.cs
@@ -144,7 +144,7 @@ public void SdcaBinaryClassification()
         }
 
         [Fact]
-        public void SdcaBinaryClassificationNoClaibration()
+        public void SdcaBinaryClassificationNoCalibration()
         {
             var env = new ConsoleEnvironment(seed: 0);
             var dataPath = GetDataPath(TestDatasets.breastCancer.trainFilename);
@@ -160,9 +160,9 @@ public void SdcaBinaryClassificationNoClaibration()
 
             // With a custom loss function we no longer get calibrated predictions.
             var est = reader.MakeNewEstimator()
-                .Append(r => (r.label, preds: ctx.Trainers.Sdca(r.label, r.features,
-                maxIterations: 2,
-                loss: loss, onFit: p => pred = p)));
+                .Append(r => (r.label, preds: ctx.Trainers.AveragedPerceptron(loss, r.label, r.features,
+                numIterations: 2,
+                onFit: p => pred = p)));
 
             var pipe = reader.Append(est);
 
@@ -186,6 +186,83 @@ public void SdcaBinaryClassificationNoClaibration()
                 Console.WriteLine($"{schema.GetColumnName(c)}, {schema.GetColumnType(c)}");
         }
 
+        [Fact]
+        public void AveragePerceptron()
+        {
+            var env = new ConsoleEnvironment(seed: 0);
+            var dataPath = GetDataPath(TestDatasets.breastCancer.trainFilename);
+            var dataSource = new MultiFileSource(dataPath);
+            var ctx = new BinaryClassificationContext(env);
+
+            var reader = TextLoader.CreateReader(env,
+                c => (label: c.LoadBool(0), features: c.LoadFloat(1, 9)));
+
+            LinearBinaryPredictor pred = null;
+            // The onFit delegate below receives only the linear predictor, so that is all this test captures.
+
+            var est = reader.MakeNewEstimator()
+                .Append(r => (r.label, preds: ctx.Trainers.AveragedPerceptron(r.label, r.features,
+                    numIterations: 2,
+                    onFit: (p) => { pred = p; })));
+
+            var pipe = reader.Append(est);
+
+            Assert.Null(pred);
+            // Fitting the pipeline is what triggers the onFit delegate.
+            var model = pipe.Fit(dataSource);
+            Assert.NotNull(pred);
+            // features is loaded with LoadFloat(1, 9), i.e. 9 input features,
+            // so we ought to have 9 weights.
+            Assert.Equal(9, pred.Weights2.Count);
+
+            var data = model.Read(dataSource);
+
+            var metrics = ctx.Evaluate(data, r => r.label, r => r.preds);
+            // Run a sanity check against a few of the metrics.
+            Assert.InRange(metrics.Accuracy, 0, 1);
+            Assert.InRange(metrics.Auc, 0, 1);
+            Assert.InRange(metrics.Auprc, 0, 1);
+            Assert.InRange(metrics.LogLoss, 0, double.PositiveInfinity);
+            Assert.InRange(metrics.Entropy, 0, double.PositiveInfinity);
+        }
+
+        [Fact]
+        public void AveragePerceptronNoCalibration()
+        {
+            var env = new ConsoleEnvironment(seed: 0);
+            var dataPath = GetDataPath(TestDatasets.breastCancer.trainFilename);
+            var dataSource = new MultiFileSource(dataPath);
+            var ctx = new BinaryClassificationContext(env);
+
+            var reader = TextLoader.CreateReader(env,
+                c => (label: c.LoadBool(0), features: c.LoadFloat(1, 9)));
+
+            LinearBinaryPredictor pred = null;
+
+            var loss = new HingeLoss(new HingeLoss.Arguments() { Margin = 1 });
+
+            // Passing the loss first selects the (score, predictedLabel) overload: with a custom loss function we no longer get calibrated predictions.
+            var est = reader.MakeNewEstimator()
+                .Append(r => (r.label, preds: ctx.Trainers.AveragedPerceptron(loss, r.label, r.features,
+                numIterations: 2, onFit: p => pred = p)));
+
+            var pipe = reader.Append(est);
+
+            Assert.Null(pred);
+            var model = pipe.Fit(dataSource);
+            Assert.NotNull(pred);
+            // 9 input features, so we ought to have 9 weights.
+            Assert.Equal(9, pred.Weights2.Count);
+
+            var data = model.Read(dataSource);
+
+            var metrics = ctx.Evaluate(data, r => r.label, r => r.preds);
+            // Run a sanity check against a few of the metrics; LogLoss and Entropy are not asserted in this test.
+            Assert.InRange(metrics.Accuracy, 0, 1);
+            Assert.InRange(metrics.Auc, 0, 1);
+            Assert.InRange(metrics.Auprc, 0, 1);
+        }
+
         [Fact]
         public void FfmBinaryClassification()
         {

From 5b5927c92724b6797f6978532981b5790e2a095f Mon Sep 17 00:00:00 2001
From: Senja Filipi <sefilipi@microsoft.com>
Date: Thu, 27 Sep 2018 15:35:43 -0700
Subject: [PATCH 02/10] lbfgs derived classes take more arguments in their
 public ctors; adding pigstensions for lr, multilr, poisson

---
 .../LogisticRegression/LbfgsPredictorBase.cs  |  54 ++++--
 .../LogisticRegression/LbfgsStatics.cs        | 179 ++++++++++++++++++
 .../LogisticRegression/LogisticRegression.cs  |  22 ++-
 .../MulticlassLogisticRegression.cs           |  16 +-
 .../PoissonRegression/PoissonRegression.cs    |  16 +-
 .../Training.cs                               | 123 ++++++++++++
 .../TrainerEstimators/LbfgsTests.cs           |   3 -
 7 files changed, 388 insertions(+), 25 deletions(-)
 create mode 100644 src/Microsoft.ML.StandardLearners/Standard/LogisticRegression/LbfgsStatics.cs

diff --git a/src/Microsoft.ML.StandardLearners/Standard/LogisticRegression/LbfgsPredictorBase.cs b/src/Microsoft.ML.StandardLearners/Standard/LogisticRegression/LbfgsPredictorBase.cs
index 4286f83379..a0bedf1c11 100644
--- a/src/Microsoft.ML.StandardLearners/Standard/LogisticRegression/LbfgsPredictorBase.cs
+++ b/src/Microsoft.ML.StandardLearners/Standard/LogisticRegression/LbfgsPredictorBase.cs
@@ -26,29 +26,29 @@ public abstract class ArgumentsBase : LearnerInputBaseWithWeight
             [Argument(ArgumentType.AtMostOnce, HelpText = "L2 regularization weight", ShortName = "l2", SortOrder = 50)]
             [TGUI(Label = "L2 Weight", Description = "Weight of L2 regularizer term", SuggestedSweeps = "0,0.1,1")]
             [TlcModule.SweepableFloatParamAttribute(0.0f, 1.0f, numSteps: 4)]
-            public float L2Weight = 1;
+            public float L2Weight = Defaults.L2Weight;
 
             [Argument(ArgumentType.AtMostOnce, HelpText = "L1 regularization weight", ShortName = "l1", SortOrder = 50)]
             [TGUI(Label = "L1 Weight", Description = "Weight of L1 regularizer term", SuggestedSweeps = "0,0.1,1")]
             [TlcModule.SweepableFloatParamAttribute(0.0f, 1.0f, numSteps: 4)]
-            public float L1Weight = 1;
+            public float L1Weight = Defaults.L1Weight;
 
             [Argument(ArgumentType.AtMostOnce, HelpText = "Tolerance parameter for optimization convergence. Lower = slower, more accurate",
                 ShortName = "ot", SortOrder = 50)]
             [TGUI(Label = "Optimization Tolerance", Description = "Threshold for optimizer convergence", SuggestedSweeps = "1e-4,1e-7")]
             [TlcModule.SweepableDiscreteParamAttribute(new object[] { 1e-4f, 1e-7f })]
-            public float OptTol = 1e-7f;
+            public float OptTol = Defaults.OptTol;
 
             [Argument(ArgumentType.AtMostOnce, HelpText = "Memory size for L-BFGS. Lower=faster, less accurate",
                 ShortName = "m", SortOrder = 50)]
             [TGUI(Description = "Memory size for L-BFGS", SuggestedSweeps = "5,20,50")]
             [TlcModule.SweepableDiscreteParamAttribute("MemorySize", new object[] { 5, 20, 50 })]
-            public int MemorySize = 20;
+            public int MemorySize = Defaults.MemorySize;
 
             [Argument(ArgumentType.AtMostOnce, HelpText = "Maximum iterations.", ShortName = "maxiter")]
             [TGUI(Label = "Max Number of Iterations")]
             [TlcModule.SweepableLongParamAttribute("MaxIterations", 1, int.MaxValue)]
-            public int MaxIterations = int.MaxValue;
+            public int MaxIterations = Defaults.MaxIterations;
 
             [Argument(ArgumentType.AtMostOnce, HelpText = "Run SGD to initialize LR weights, converging to this tolerance",
                 ShortName = "sgd")]
@@ -90,7 +90,17 @@ public abstract class ArgumentsBase : LearnerInputBaseWithWeight
             public bool DenseOptimizer = false;
 
             [Argument(ArgumentType.AtMostOnce, HelpText = "Enforce non-negative weights", ShortName = "nn", SortOrder = 90)]
-            public bool EnforceNonNegativity = false;
+            public bool EnforceNonNegativity = Defaults.EnforceNonNegativity;
+
+            internal static class Defaults
+            {
+                internal const float L2Weight = 1;
+                internal const float L1Weight = 1;
+                internal const float OptTol = 1e-7f;
+                internal const int MemorySize = 20;
+                internal const int MaxIterations = int.MaxValue;
+                internal const bool EnforceNonNegativity = false;
+            }
         }
 
         private const string RegisterName = nameof(LbfgsTrainerBase<TArgs, TTransformer, TModel>);
@@ -142,12 +152,22 @@ public abstract class ArgumentsBase : LearnerInputBaseWithWeight
         public override TrainerInfo Info => _info;
 
         internal LbfgsTrainerBase(IHostEnvironment env, string featureColumn, SchemaShape.Column labelColumn,
-            string weightColumn = null, Action<TArgs> advancedSettings = null)
-            : this(env, ArgsInit(featureColumn, labelColumn, weightColumn, advancedSettings), labelColumn)
+            string weightColumn, Action<TArgs> advancedSettings, float l1Weight,
+            float l2Weight,
+            float optimizationTolerance,
+            int memorySize,
+            bool enforceNoNegativity)
+            : this(env, ArgsInit(featureColumn, labelColumn, weightColumn, advancedSettings), labelColumn,
+                  l1Weight, l2Weight, optimizationTolerance, memorySize, enforceNoNegativity)
         {
         }
 
-        internal LbfgsTrainerBase(IHostEnvironment env, TArgs args, SchemaShape.Column labelColumn)
+        internal LbfgsTrainerBase(IHostEnvironment env, TArgs args, SchemaShape.Column labelColumn,
+            float? l1Weight = null,
+            float? l2Weight = null,
+            float? optimizationTolerance = null,
+            int? memorySize = null,
+            bool? enforceNoNegativity = null)
             : base(Contracts.CheckRef(env, nameof(env)).Register(RegisterName), TrainerUtils.MakeR4VecFeature(args.FeatureColumn),
                   labelColumn, TrainerUtils.MakeR4ScalarWeightColumn(args.WeightColumn))
         {
@@ -164,10 +184,16 @@ internal LbfgsTrainerBase(IHostEnvironment env, TArgs args, SchemaShape.Column l
             Contracts.CheckUserArg(Args.SgdInitializationTolerance >= 0, nameof(Args.SgdInitializationTolerance), "Must be non-negative");
             Contracts.CheckUserArg(Args.NumThreads == null || Args.NumThreads.Value >= 0, nameof(Args.NumThreads), "Must be non-negative");
 
-            L2Weight = Args.L2Weight;
-            L1Weight = Args.L1Weight;
-            OptTol = Args.OptTol;
-            MemorySize = Args.MemorySize;
+            // Null means "not provided". A lifted comparison with null is false, so null must be accepted explicitly.
+            Contracts.CheckParam(l2Weight == null || l2Weight.Value >= 0, nameof(l2Weight), "Must be non-negative, if provided.");
+            Contracts.CheckParam(l1Weight == null || l1Weight.Value >= 0, nameof(l1Weight), "Must be non-negative, if provided");
+            Contracts.CheckParam(optimizationTolerance == null || optimizationTolerance.Value > 0, nameof(optimizationTolerance), "Must be positive, if provided.");
+            Contracts.CheckParam(memorySize == null || memorySize.Value > 0, nameof(memorySize), "Must be positive, if provided.");
+            // Explicitly provided values take precedence over Args. Review: Warn about the overriding behavior
+            L2Weight = l2Weight ?? Args.L2Weight;
+            L1Weight = l1Weight ?? Args.L1Weight;
+            OptTol = optimizationTolerance ?? Args.OptTol;
+            MemorySize = memorySize ?? Args.MemorySize;
             MaxIterations = Args.MaxIterations;
             SgdInitializationTolerance = Args.SgdInitializationTolerance;
             Quiet = Args.Quiet;
@@ -175,7 +201,7 @@ internal LbfgsTrainerBase(IHostEnvironment env, TArgs args, SchemaShape.Column l
             UseThreads = Args.UseThreads;
             NumThreads = Args.NumThreads;
             DenseOptimizer = Args.DenseOptimizer;
-            EnforceNonNegativity = Args.EnforceNonNegativity;
+            EnforceNonNegativity = enforceNoNegativity ?? Args.EnforceNonNegativity;
 
             if (EnforceNonNegativity && ShowTrainingStats)
             {
diff --git a/src/Microsoft.ML.StandardLearners/Standard/LogisticRegression/LbfgsStatics.cs b/src/Microsoft.ML.StandardLearners/Standard/LogisticRegression/LbfgsStatics.cs
new file mode 100644
index 0000000000..020a759159
--- /dev/null
+++ b/src/Microsoft.ML.StandardLearners/Standard/LogisticRegression/LbfgsStatics.cs
@@ -0,0 +1,179 @@
+﻿// Licensed to the .NET Foundation under one or more agreements.
+// The .NET Foundation licenses this file to you under the MIT license.
+// See the LICENSE file in the project root for more information.
+
+using System;
+using Microsoft.ML.Runtime;
+using Microsoft.ML.Runtime.Data;
+using Microsoft.ML.Runtime.Internal.Calibration;
+using Microsoft.ML.Runtime.Learners;
+using Microsoft.ML.Runtime.Training;
+using Microsoft.ML.StaticPipe;
+using Microsoft.ML.StaticPipe.Runtime;
+
+namespace Microsoft.ML.Trainers
+{
+    using Arguments = LogisticRegression.Arguments;
+    /// <summary>
+    /// Extension methods and utilities for instantiating LogisticRegression trainer estimators inside statically typed pipelines.
+    /// </summary>
+    public static class LogisticRegressionStatics
+    {
+        /// <summary>
+        ///  Predict a target using a linear binary classification model trained with the <see cref="Runtime.Learners.LogisticRegression"/> trainer.
+        /// </summary>
+        /// <param name="ctx">The binary classification context trainer object.</param>
+        /// <param name="label">The label, or dependent variable.</param>
+        /// <param name="features">The features, or independent variables.</param>
+        /// <param name="weights">The optional example weights.</param>
+        /// <param name="enoforceNoNegativity">Enforce non-negative weights.</param>
+        /// <param name="l1Weight">Weight of L1 regularizer term.</param>
+        /// <param name="l2Weight">Weight of L2 regularizer term.</param>
+        /// <param name="memorySize">Memory size for L-BFGS. Lower=faster, less accurate.</param>
+        /// <param name="optimizationTolerance">Threshold for optimizer convergence.</param>
+        /// <param name="onFit">A delegate that is called every time the
+        /// <see cref="Estimator{TTupleInShape, TTupleOutShape, TTransformer}.Fit(DataView{TTupleInShape})"/> method is called on the
+        /// <see cref="Estimator{TTupleInShape, TTupleOutShape, TTransformer}"/> instance created out of this. This delegate will receive
+        /// the linear model that was trained.  Note that this action cannot change the result in any way; it is only a way for the caller to
+        /// be informed about what was learnt.</param>
+        /// <returns>The predicted output.</returns>
+        public static (Scalar<float> score, Scalar<float> probability, Scalar<bool> predictedLabel) LogisticRegression(this BinaryClassificationContext.BinaryClassificationTrainers ctx,
+            Scalar<bool> label,
+            Vector<float> features,
+            Scalar<float> weights = null,
+            float l1Weight = Arguments.Defaults.L1Weight,
+            float l2Weight = Arguments.Defaults.L2Weight,
+            float optimizationTolerance = Arguments.Defaults.OptTol,
+            int memorySize = Arguments.Defaults.MemorySize,
+            bool enoforceNoNegativity = Arguments.Defaults.EnforceNonNegativity,
+            Action<ParameterMixingCalibratedPredictor> onFit = null)
+        {
+            ValidateParams(label, features, weights, l1Weight, l2Weight, optimizationTolerance, memorySize, enoforceNoNegativity, onFit);
+
+            var rec = new TrainerEstimatorReconciler.BinaryClassifier(
+                (env, labelName, featuresName, weightsName) =>
+                {
+                    var trainer = new LogisticRegression(env, featuresName, labelName, weightsName,
+                        l1Weight, l2Weight, optimizationTolerance, memorySize, enoforceNoNegativity);
+
+                    if (onFit != null)
+                        return trainer.WithOnFitDelegate(trans => onFit(trans.Model));
+                    return trainer;
+
+                }, label, features, weights);
+
+            return rec.Output;
+        }
+
+        /// <summary>
+        /// Predict a target using a linear regression model trained with the <c>PoissonRegression</c> trainer.
+        /// </summary>
+        /// <param name="ctx">The regression context trainer object.</param>
+        /// <param name="label">The label, or dependent variable.</param>
+        /// <param name="features">The features, or independent variables.</param>
+        /// <param name="weights">The optional example weights.</param>
+        /// <param name="enoforceNoNegativity">Enforce non-negative weights.</param>
+        /// <param name="l1Weight">Weight of L1 regularizer term.</param>
+        /// <param name="l2Weight">Weight of L2 regularizer term.</param>
+        /// <param name="memorySize">Memory size for L-BFGS. Lower=faster, less accurate.</param>
+        /// <param name="optimizationTolerance">Threshold for optimizer convergence.</param>
+        /// <param name="onFit">A delegate that is called every time the
+        /// <see cref="Estimator{TTupleInShape, TTupleOutShape, TTransformer}.Fit(DataView{TTupleInShape})"/> method is called on the
+        /// <see cref="Estimator{TTupleInShape, TTupleOutShape, TTransformer}"/> instance created out of this. This delegate will receive
+        /// the linear model that was trained.  Note that this action cannot change the result in any way; it is only a way for the caller to
+        /// be informed about what was learnt.</param>
+        /// <returns>The predicted output.</returns>
+        public static Scalar<float> PoissonRegression(this RegressionContext.RegressionTrainers ctx,
+            Scalar<float> label,
+            Vector<float> features,
+            Scalar<float> weights = null,
+            float l1Weight = Arguments.Defaults.L1Weight,
+            float l2Weight = Arguments.Defaults.L2Weight,
+            float optimizationTolerance = Arguments.Defaults.OptTol,
+            int memorySize = Arguments.Defaults.MemorySize,
+            bool enoforceNoNegativity = Arguments.Defaults.EnforceNonNegativity,
+            Action<PoissonRegressionPredictor> onFit = null)
+        {
+            ValidateParams(label, features, weights, l1Weight, l2Weight, optimizationTolerance, memorySize, enoforceNoNegativity, onFit);
+
+            var rec = new TrainerEstimatorReconciler.Regression(
+                (env, labelName, featuresName, weightsName) =>
+                {
+                    var trainer = new PoissonRegression(env, featuresName, labelName, weightsName,
+                        l1Weight, l2Weight, optimizationTolerance, memorySize, enoforceNoNegativity);
+
+                    if (onFit != null)
+                        return trainer.WithOnFitDelegate(trans => onFit(trans.Model));
+
+                    return trainer;
+                }, label, features, weights);
+
+            return rec.Score;
+        }
+
+        /// <summary>
+        /// Predict a target using a linear multiclass classification model trained with the <see cref="Runtime.Learners.MulticlassLogisticRegression"/> trainer.
+        /// </summary>
+        /// <param name="ctx">The multiclass classification context trainer object.</param>
+        /// <param name="label">The label, or dependent variable.</param>
+        /// <param name="features">The features, or independent variables.</param>
+        /// <param name="weights">The optional example weights.</param>
+        /// <param name="enoforceNoNegativity">Enforce non-negative weights.</param>
+        /// <param name="l1Weight">Weight of L1 regularizer term.</param>
+        /// <param name="l2Weight">Weight of L2 regularizer term.</param>
+        /// <param name="memorySize">Memory size for L-BFGS. Lower=faster, less accurate.</param>
+        /// <param name="optimizationTolerance">Threshold for optimizer convergence.</param>
+        /// <param name="onFit">A delegate that is called every time the
+        /// <see cref="Estimator{TTupleInShape, TTupleOutShape, TTransformer}.Fit(DataView{TTupleInShape})"/> method is called on the
+        /// <see cref="Estimator{TTupleInShape, TTupleOutShape, TTransformer}"/> instance created out of this. This delegate will receive
+        /// the linear model that was trained. Note that this action cannot change the
+        /// result in any way; it is only a way for the caller to be informed about what was learnt.</param>
+        /// <returns>The set of output columns including in order the predicted per-class likelihoods (between 0 and 1, and summing up to 1), and the predicted label.</returns>
+        public static (Vector<float> score, Key<uint, TVal> predictedLabel)
+            MultiClassLogisticRegression<TVal>(this MulticlassClassificationContext.MulticlassClassificationTrainers ctx,
+            Key<uint, TVal> label,
+            Vector<float> features,
+            Scalar<float> weights = null,
+            float l1Weight = Arguments.Defaults.L1Weight,
+            float l2Weight = Arguments.Defaults.L2Weight,
+            float optimizationTolerance = Arguments.Defaults.OptTol,
+            int memorySize = Arguments.Defaults.MemorySize,
+            bool enoforceNoNegativity = Arguments.Defaults.EnforceNonNegativity,
+            Action<MulticlassLogisticRegressionPredictor> onFit = null)
+        {
+            ValidateParams(label, features, weights, l1Weight, l2Weight, optimizationTolerance, memorySize, enoforceNoNegativity, onFit);
+
+            var rec = new TrainerEstimatorReconciler.MulticlassClassifier<TVal>(
+                (env, labelName, featuresName, weightsName) =>
+                {
+                    var trainer = new MulticlassLogisticRegression(env, featuresName, labelName, weightsName,
+                         l1Weight, l2Weight, optimizationTolerance, memorySize, enoforceNoNegativity);
+
+                    if (onFit != null)
+                        return trainer.WithOnFitDelegate(trans => onFit(trans.Model));
+                    return trainer;
+                }, label, features, weights);
+
+            return rec.Output;
+        }
+
+        private static void ValidateParams(PipelineColumn label,
+            Vector<float> features,
+            Scalar<float> weights = null,
+            float l1Weight = Arguments.Defaults.L1Weight,
+            float l2Weight = Arguments.Defaults.L2Weight,
+            float optimizationTolerance = Arguments.Defaults.OptTol,
+            int memorySize = Arguments.Defaults.MemorySize,
+            bool enoforceNoNegativity = Arguments.Defaults.EnforceNonNegativity,
+            Delegate onFit = null)
+        {
+            Contracts.CheckValue(label, nameof(label));
+            Contracts.CheckValue(features, nameof(features));
+            Contracts.CheckParam(l2Weight >= 0, nameof(l2Weight), "Must be non-negative");
+            Contracts.CheckParam(l1Weight >= 0, nameof(l1Weight), "Must be non-negative");
+            Contracts.CheckParam(optimizationTolerance > 0, nameof(optimizationTolerance), "Must be positive");
+            Contracts.CheckParam(memorySize > 0, nameof(memorySize), "Must be positive");
+            Contracts.CheckValueOrNull(onFit);
+        }
+    }
+}
diff --git a/src/Microsoft.ML.StandardLearners/Standard/LogisticRegression/LogisticRegression.cs b/src/Microsoft.ML.StandardLearners/Standard/LogisticRegression/LogisticRegression.cs
index 0914c63c33..87c1c1bde9 100644
--- a/src/Microsoft.ML.StandardLearners/Standard/LogisticRegression/LogisticRegression.cs
+++ b/src/Microsoft.ML.StandardLearners/Standard/LogisticRegression/LogisticRegression.cs
@@ -54,10 +54,24 @@ public sealed class Arguments : ArgumentsBase
         /// <param name="labelColumn">The name of the label column.</param>
         /// <param name="featureColumn">The name of the feature column.</param>
         /// <param name="weightColumn">The name for the example weight column.</param>
+        /// <param name="enforceNoNegativity">Enforce non-negative weights.</param>
+        /// <param name="l1Weight">Weight of L1 regularizer term.</param>
+        /// <param name="l2Weight">Weight of L2 regularizer term.</param>
+        /// <param name="memorySize">Memory size for L-BFGS. Lower=faster, less accurate.</param>
+        /// <param name="optimizationTolerance">Threshold for optimizer convergence.</param>
         /// <param name="advancedSettings">A delegate to apply all the advanced arguments to the algorithm.</param>
-        public LogisticRegression(IHostEnvironment env, string featureColumn, string labelColumn,
-            string weightColumn = null, Action<Arguments> advancedSettings = null)
-            : base(env, featureColumn, TrainerUtils.MakeR4ScalarLabel(labelColumn), weightColumn, advancedSettings)
+        public LogisticRegression(IHostEnvironment env,
+            string featureColumn,
+            string labelColumn,
+            string weightColumn = null,
+            float l1Weight = Arguments.Defaults.L1Weight,
+            float l2Weight = Arguments.Defaults.L2Weight,
+            float optimizationTolerance = Arguments.Defaults.OptTol,
+            int memorySize = Arguments.Defaults.MemorySize,
+            bool enforceNoNegativity = Arguments.Defaults.EnforceNonNegativity,
+            Action<Arguments> advancedSettings = null)
+            : base(env, featureColumn, TrainerUtils.MakeBoolScalarLabel(labelColumn), weightColumn, advancedSettings,
+                  l1Weight, l2Weight,  optimizationTolerance, memorySize, enforceNoNegativity)
         {
             Host.CheckNonEmpty(featureColumn, nameof(featureColumn));
             Host.CheckNonEmpty(labelColumn, nameof(labelColumn));
@@ -70,7 +84,7 @@ public LogisticRegression(IHostEnvironment env, string featureColumn, string lab
         /// Initializes a new instance of <see cref="LogisticRegression"/>
         /// </summary>
         internal LogisticRegression(IHostEnvironment env, Arguments args)
-            : base(env, args, TrainerUtils.MakeR4ScalarLabel(args.LabelColumn))
+            : base(env, args, TrainerUtils.MakeBoolScalarLabel(args.LabelColumn))
         {
             _posWeight = 0;
             ShowTrainingStats = Args.ShowTrainingStats;
diff --git a/src/Microsoft.ML.StandardLearners/Standard/LogisticRegression/MulticlassLogisticRegression.cs b/src/Microsoft.ML.StandardLearners/Standard/LogisticRegression/MulticlassLogisticRegression.cs
index 52d1688638..40e3090c74 100644
--- a/src/Microsoft.ML.StandardLearners/Standard/LogisticRegression/MulticlassLogisticRegression.cs
+++ b/src/Microsoft.ML.StandardLearners/Standard/LogisticRegression/MulticlassLogisticRegression.cs
@@ -76,10 +76,22 @@ public sealed class Arguments : ArgumentsBase
         /// <param name="labelColumn">The name of the label column.</param>
         /// <param name="featureColumn">The name of the feature column.</param>
         /// <param name="weightColumn">The name for the example weight column.</param>
+        /// <param name="enforceNoNegativity">Enforce non-negative weights.</param>
+        /// <param name="l1Weight">Weight of L1 regularizer term.</param>
+        /// <param name="l2Weight">Weight of L2 regularizer term.</param>
+        /// <param name="memorySize">Memory size for L-BFGS. Lower=faster, less accurate.</param>
+        /// <param name="optimizationTolerance">Threshold for optimizer convergence.</param>
         /// <param name="advancedSettings">A delegate to apply all the advanced arguments to the algorithm.</param>
         public MulticlassLogisticRegression(IHostEnvironment env, string featureColumn, string labelColumn,
-            string weightColumn = null, Action<Arguments> advancedSettings = null)
-            : base(env, featureColumn, TrainerUtils.MakeU4ScalarLabel(labelColumn), weightColumn, advancedSettings)
+            string weightColumn = null,
+            float l1Weight = Arguments.Defaults.L1Weight,
+            float l2Weight = Arguments.Defaults.L2Weight,
+            float optimizationTolerance = Arguments.Defaults.OptTol,
+            int memorySize = Arguments.Defaults.MemorySize,
+            bool enforceNoNegativity = Arguments.Defaults.EnforceNonNegativity,
+            Action<Arguments> advancedSettings = null)
+            : base(env, featureColumn, TrainerUtils.MakeU4ScalarLabel(labelColumn), weightColumn, advancedSettings,
+                  l1Weight, l2Weight, optimizationTolerance, memorySize, enforceNoNegativity)
         {
             Host.CheckNonEmpty(featureColumn, nameof(featureColumn));
             Host.CheckNonEmpty(labelColumn, nameof(labelColumn));
diff --git a/src/Microsoft.ML.StandardLearners/Standard/PoissonRegression/PoissonRegression.cs b/src/Microsoft.ML.StandardLearners/Standard/PoissonRegression/PoissonRegression.cs
index ed400aaeac..2e703bf4a0 100644
--- a/src/Microsoft.ML.StandardLearners/Standard/PoissonRegression/PoissonRegression.cs
+++ b/src/Microsoft.ML.StandardLearners/Standard/PoissonRegression/PoissonRegression.cs
@@ -46,10 +46,22 @@ public sealed class Arguments : ArgumentsBase
         /// <param name="labelColumn">The name of the label column.</param>
         /// <param name="featureColumn">The name of the feature column.</param>
         /// <param name="weightColumn">The name for the example weight column.</param>
+        /// <param name="enforceNoNegativity">Enforce non-negative weights.</param>
+        /// <param name="l1Weight">Weight of L1 regularizer term.</param>
+        /// <param name="l2Weight">Weight of L2 regularizer term.</param>
+        /// <param name="memorySize">Memory size for L-BFGS. Lower=faster, less accurate.</param>
+        /// <param name="optimizationTolerance">Threshold for optimizer convergence.</param>
         /// <param name="advancedSettings">A delegate to apply all the advanced arguments to the algorithm.</param>
         public PoissonRegression(IHostEnvironment env, string featureColumn, string labelColumn,
-            string weightColumn = null, Action<Arguments> advancedSettings = null)
-            : base(env, featureColumn, TrainerUtils.MakeR4ScalarLabel(labelColumn), weightColumn, advancedSettings)
+            string weightColumn = null,
+            float l1Weight = Arguments.Defaults.L1Weight,
+            float l2Weight = Arguments.Defaults.L2Weight,
+            float optimizationTolerance = Arguments.Defaults.OptTol,
+            int memorySize = Arguments.Defaults.MemorySize,
+            bool enforceNoNegativity = Arguments.Defaults.EnforceNonNegativity,
+            Action<Arguments> advancedSettings = null)
+            : base(env, featureColumn, TrainerUtils.MakeR4ScalarLabel(labelColumn), weightColumn, advancedSettings,
+                   l1Weight, l2Weight, optimizationTolerance, memorySize, enforceNoNegativity)
         {
             Host.CheckNonEmpty(featureColumn, nameof(featureColumn));
             Host.CheckNonEmpty(labelColumn, nameof(labelColumn));
diff --git a/test/Microsoft.ML.StaticPipelineTesting/Training.cs b/test/Microsoft.ML.StaticPipelineTesting/Training.cs
index b7bf2606d4..11635fe3d3 100644
--- a/test/Microsoft.ML.StaticPipelineTesting/Training.cs
+++ b/test/Microsoft.ML.StaticPipelineTesting/Training.cs
@@ -528,5 +528,128 @@ public void LightGbmRegression()
             Assert.Equal(metrics.Rms * metrics.Rms, metrics.L2, 5);
             Assert.InRange(metrics.LossFn, 0, double.PositiveInfinity);
         }
+
+        [Fact]
+        public void PoissonRegression()
+        {
+            var env = new ConsoleEnvironment(seed: 0);
+            var dataPath = GetDataPath(TestDatasets.generatedRegressionDataset.trainFilename);
+            var dataSource = new MultiFileSource(dataPath);
+
+            var ctx = new RegressionContext(env);
+
+            var reader = TextLoader.CreateReader(env,
+                c => (label: c.LoadFloat(11), features: c.LoadFloat(0, 10)),
+                separator: ';', hasHeader: true);
+
+            PoissonRegressionPredictor pred = null;
+
+            var est = reader.MakeNewEstimator()
+                .Append(r => (r.label, score: ctx.Trainers.PoissonRegression(r.label, r.features,
+                    l1Weight: 2,
+                    enoforceNoNegativity: true,
+                    onFit: (p) => { pred = p; })));
+
+            var pipe = reader.Append(est);
+
+            Assert.Null(pred);
+            var model = pipe.Fit(dataSource);
+            Assert.NotNull(pred);
+            // 11 input features, so we ought to have 11 weights.
+            VBuffer<float> weights = new VBuffer<float>();
+            pred.GetFeatureWeights(ref weights);
+            Assert.Equal(11, weights.Length);
+
+            var data = model.Read(dataSource);
+
+            var metrics = ctx.Evaluate(data, r => r.label, r => r.score, new PoissonLoss());
+            // Run a sanity check against a few of the metrics.
+            Assert.InRange(metrics.L1, 0, double.PositiveInfinity);
+            Assert.InRange(metrics.L2, 0, double.PositiveInfinity);
+            Assert.InRange(metrics.Rms, 0, double.PositiveInfinity);
+            Assert.Equal(metrics.Rms * metrics.Rms, metrics.L2, 5);
+            Assert.InRange(metrics.LossFn, 0, double.PositiveInfinity);
+        }
+
+        [Fact]
+        public void LogisticRegression()
+        {
+            var env = new ConsoleEnvironment(seed: 0);
+            var dataPath = GetDataPath(TestDatasets.breastCancer.trainFilename);
+            var dataSource = new MultiFileSource(dataPath);
+            var ctx = new BinaryClassificationContext(env);
+
+            var reader = TextLoader.CreateReader(env,
+                c => (label: c.LoadBool(0), features: c.LoadFloat(1, 9)));
+
+            IPredictorWithFeatureWeights<float> pred = null;
+
+            var est = reader.MakeNewEstimator()
+                .Append(r => (r.label, preds: ctx.Trainers.LogisticRegression(r.label, r.features,
+                    l1Weight: 10,
+                    onFit: (p) => { pred = p; })));
+
+            var pipe = reader.Append(est);
+
+            Assert.Null(pred);
+            var model = pipe.Fit(dataSource);
+            Assert.NotNull(pred);
+
+            // 9 input features, so we ought to have 9 weights.
+            VBuffer<float> weights = new VBuffer<float>();
+            pred.GetFeatureWeights(ref weights);
+            Assert.Equal(9, weights.Length);
+
+            var data = model.Read(dataSource);
+
+            var metrics = ctx.Evaluate(data, r => r.label, r => r.preds);
+            // Run a sanity check against a few of the metrics.
+            Assert.InRange(metrics.Accuracy, 0, 1);
+            Assert.InRange(metrics.Auc, 0, 1);
+            Assert.InRange(metrics.Auprc, 0, 1);
+        }
+
+        [Fact]
+        public void MulticlassLogisticRegression()
+        {
+            var env = new ConsoleEnvironment(seed: 0);
+            var dataPath = GetDataPath(TestDatasets.iris.trainFilename);
+            var dataSource = new MultiFileSource(dataPath);
+
+            var ctx = new MulticlassClassificationContext(env);
+            var reader = TextLoader.CreateReader(env,
+                c => (label: c.LoadText(0), features: c.LoadFloat(1, 4)));
+
+            MulticlassLogisticRegressionPredictor pred = null;
+
+            // Map the text label to a key type, then train the multiclass logistic regression on it.
+            var est = reader.MakeNewEstimator()
+                .Append(r => (label: r.label.ToKey(), r.features))
+                .Append(r => (r.label, preds: ctx.Trainers.MultiClassLogisticRegression(
+                    r.label,
+                    r.features, onFit: p => pred = p)));
+
+            var pipe = reader.Append(est);
+
+            Assert.Null(pred);
+            var model = pipe.Fit(dataSource);
+            Assert.NotNull(pred);
+            VBuffer<float>[] weights = default;
+            pred.GetWeights(ref weights, out int n);
+            Assert.True(n == 3 && n == weights.Length);
+            foreach (var w in weights)
+                Assert.True(w.Length == 4);
+
+            var data = model.Read(dataSource);
+
+            // Just output some data on the schema for fun.
+            var schema = data.AsDynamic.Schema;
+            for (int c = 0; c < schema.ColumnCount; ++c)
+                Console.WriteLine($"{schema.GetColumnName(c)}, {schema.GetColumnType(c)}");
+
+            var metrics = ctx.Evaluate(data, r => r.label, r => r.preds, 2);
+            Assert.True(metrics.LogLoss > 0);
+            Assert.True(metrics.TopKAccuracy > 0);
+        }
     }
 }
diff --git a/test/Microsoft.ML.Tests/TrainerEstimators/LbfgsTests.cs b/test/Microsoft.ML.Tests/TrainerEstimators/LbfgsTests.cs
index 8d4f29591f..fb54ad52ce 100644
--- a/test/Microsoft.ML.Tests/TrainerEstimators/LbfgsTests.cs
+++ b/test/Microsoft.ML.Tests/TrainerEstimators/LbfgsTests.cs
@@ -3,11 +3,8 @@
 // See the LICENSE file in the project root for more information.
 
 using Microsoft.ML.Core.Data;
-using Microsoft.ML.Runtime;
 using Microsoft.ML.Runtime.Data;
-using Microsoft.ML.Runtime.EntryPoints;
 using Microsoft.ML.Runtime.Learners;
-using Microsoft.ML.Runtime.RunTests;
 using Xunit;
 
 namespace Microsoft.ML.Tests.TrainerEstimators

From 60df43c768388c50ee6ac056ab98ffc91200bdce Mon Sep 17 00:00:00 2001
From: Senja Filipi <sefilipi@microsoft.com>
Date: Thu, 27 Sep 2018 16:56:19 -0700
Subject: [PATCH 03/10] Ogd static xtensions. Removing the AP xtension that
 produces the probability column.

---
 .../Regression/RegressionEnsembleTrainer.cs   |  2 +-
 .../Standard/Online/AveragedLinear.cs         |  8 +-
 .../Standard/Online/AveragedPerceptron.cs     |  3 +-
 .../Standard/Online/OnlineGradientDescent.cs  | 62 ++++++++++---
 .../Standard/Online/OnlineLearnerStatic.cs    | 84 ++++++------------
 .../Standard/Online/OnlineLinear.cs           | 18 +---
 .../Training.cs                               | 86 ++++++++++---------
 .../TrainerEstimators/OnlineLinearTests.cs    |  2 +-
 8 files changed, 130 insertions(+), 135 deletions(-)

diff --git a/src/Microsoft.ML.Ensemble/Trainer/Regression/RegressionEnsembleTrainer.cs b/src/Microsoft.ML.Ensemble/Trainer/Regression/RegressionEnsembleTrainer.cs
index 3fe853aff5..344adbe39f 100644
--- a/src/Microsoft.ML.Ensemble/Trainer/Regression/RegressionEnsembleTrainer.cs
+++ b/src/Microsoft.ML.Ensemble/Trainer/Regression/RegressionEnsembleTrainer.cs
@@ -51,7 +51,7 @@ public Arguments()
                 BasePredictors = new[]
                 {
                     ComponentFactoryUtils.CreateFromFunction(
-                        env => new OnlineGradientDescentTrainer(env, new OnlineGradientDescentTrainer.Arguments()))
+                        env => new OnlineGradientDescentTrainer(env, DefaultColumnNames.Label, DefaultColumnNames.Features))
                 };
             }
         }
diff --git a/src/Microsoft.ML.StandardLearners/Standard/Online/AveragedLinear.cs b/src/Microsoft.ML.StandardLearners/Standard/Online/AveragedLinear.cs
index c2656bd6f5..5871c932dd 100644
--- a/src/Microsoft.ML.StandardLearners/Standard/Online/AveragedLinear.cs
+++ b/src/Microsoft.ML.StandardLearners/Standard/Online/AveragedLinear.cs
@@ -22,12 +22,12 @@ public abstract class AveragedLinearArguments : OnlineLinearArguments
         [Argument(ArgumentType.AtMostOnce, HelpText = "Learning rate", ShortName = "lr", SortOrder = 50)]
         [TGUI(Label = "Learning rate", SuggestedSweeps = "0.01,0.1,0.5,1.0")]
         [TlcModule.SweepableDiscreteParam("LearningRate", new object[] { 0.01, 0.1, 0.5, 1.0 })]
-        public Float LearningRate = DefaultAveragedArgs.LearningRate;
+        public Float LearningRate = AveragedDefaultArgs.LearningRate;
 
         [Argument(ArgumentType.AtMostOnce, HelpText = "Decrease learning rate", ShortName = "decreaselr", SortOrder = 50)]
         [TGUI(Label = "Decrease Learning Rate", Description = "Decrease learning rate as iterations progress")]
         [TlcModule.SweepableDiscreteParam("DecreaseLearningRate", new object[] { false, true })]
-        public bool DecreaseLearningRate = DefaultAveragedArgs.DecreaseLearningRate;
+        public bool DecreaseLearningRate = AveragedDefaultArgs.DecreaseLearningRate;
 
         [Argument(ArgumentType.AtMostOnce, HelpText = "Number of examples after which weights will be reset to the current average", ShortName = "numreset")]
         public long? ResetWeightsAfterXExamples = null;
@@ -38,7 +38,7 @@ public abstract class AveragedLinearArguments : OnlineLinearArguments
         [Argument(ArgumentType.AtMostOnce, HelpText = "L2 Regularization Weight", ShortName = "reg", SortOrder = 50)]
         [TGUI(Label = "L2 Regularization Weight")]
         [TlcModule.SweepableFloatParam("L2RegularizerWeight", 0.0f, 0.4f)]
-        public Float L2RegularizerWeight = DefaultAveragedArgs.L2RegularizerWeight;
+        public Float L2RegularizerWeight = AveragedDefaultArgs.L2RegularizerWeight;
 
         [Argument(ArgumentType.AtMostOnce, HelpText = "Extra weight given to more recent updates", ShortName = "rg")]
         public Float RecencyGain = 0;
@@ -52,7 +52,7 @@ public abstract class AveragedLinearArguments : OnlineLinearArguments
         [Argument(ArgumentType.AtMostOnce, HelpText = "The inexactness tolerance for averaging", ShortName = "avgtol")]
         public Float AveragedTolerance = (Float)1e-2;
 
-        internal static class DefaultAveragedArgs
+        internal class AveragedDefaultArgs : OnlineDefaultArgs
         {
             internal const Float LearningRate = 1;
             internal const bool DecreaseLearningRate = false;
diff --git a/src/Microsoft.ML.StandardLearners/Standard/Online/AveragedPerceptron.cs b/src/Microsoft.ML.StandardLearners/Standard/Online/AveragedPerceptron.cs
index 4862caa4d6..8cbb1978a5 100644
--- a/src/Microsoft.ML.StandardLearners/Standard/Online/AveragedPerceptron.cs
+++ b/src/Microsoft.ML.StandardLearners/Standard/Online/AveragedPerceptron.cs
@@ -67,9 +67,8 @@ protected override SchemaShape.Column[] GetOutputColumnsCore(SchemaShape inputSc
         {
             return new[]
             {
+                // REVIEW AP is currently not calibrating. Add the probability column after fixing the behavior.
                 new SchemaShape.Column(DefaultColumnNames.Score, SchemaShape.Column.VectorKind.Scalar, NumberType.R4, false, new SchemaShape(MetadataUtils.GetTrainerOutputMetadata())),
-                //sefilipi: should it be here, since NeedCalibration is true?
-                new SchemaShape.Column(DefaultColumnNames.Probability, SchemaShape.Column.VectorKind.Scalar, NumberType.R4, false, new SchemaShape(MetadataUtils.GetTrainerOutputMetadata(true))),
                 new SchemaShape.Column(DefaultColumnNames.PredictedLabel, SchemaShape.Column.VectorKind.Scalar, BoolType.Instance, false, new SchemaShape(MetadataUtils.GetTrainerOutputMetadata()))
             };
         }
diff --git a/src/Microsoft.ML.StandardLearners/Standard/Online/OnlineGradientDescent.cs b/src/Microsoft.ML.StandardLearners/Standard/Online/OnlineGradientDescent.cs
index 768bb1da75..b9b4a6b11c 100644
--- a/src/Microsoft.ML.StandardLearners/Standard/Online/OnlineGradientDescent.cs
+++ b/src/Microsoft.ML.StandardLearners/Standard/Online/OnlineGradientDescent.cs
@@ -46,27 +46,69 @@ public sealed class Arguments : AveragedLinearArguments
             /// </summary>
             public Arguments()
             {
-                LearningRate = (Float)0.1;
-                DecreaseLearningRate = true;
+                LearningRate = OgdDefaultArgs.LearningRate;
+                DecreaseLearningRate = OgdDefaultArgs.DecreaseLearningRate;
             }
+
+            internal class OgdDefaultArgs : AveragedDefaultArgs
+            {
+               internal new const float LearningRate = 0.1f;
+               internal new const bool DecreaseLearningRate = true;
+            }
+        }
+
+        /// <summary>
+        /// Trains a new <see cref="RegressionPredictionTransformer{LinearRegressionPredictor}"/>.
+        /// </summary>
+        /// <param name="env">The private instance of <see cref="IHostEnvironment"/>.</param>
+        /// <param name="labelColumn">Name of the label column.</param>
+        /// <param name="featureColumn">Name of the feature column.</param>
+        /// <param name="learningRate">The learning rate.</param>
+        /// <param name="decreaseLearningRate">Decrease learning rate as iterations progress.</param>
+        /// <param name="l2RegularizerWeight">L2 Regularization Weight.</param>
+        /// <param name="numIterations">Number of training iterations through the data.</param>
+        /// <param name="weightsColumn">The name of the weights column.</param>
+        /// <param name="lossFunction">The custom loss function. Defaults to <see cref="SquaredLoss"/> if not provided.</param>
+        public OnlineGradientDescentTrainer(IHostEnvironment env,
+            string labelColumn,
+            string featureColumn,
+            float learningRate = Arguments.OgdDefaultArgs.LearningRate,
+            bool decreaseLearningRate =Arguments.OgdDefaultArgs.DecreaseLearningRate,
+            float l2RegularizerWeight = Arguments.OgdDefaultArgs.L2RegularizerWeight,
+            int numIterations = Arguments.OgdDefaultArgs.NumIterations,
+            string weightsColumn = null,
+            IRegressionLoss lossFunction = null)
+            : base(new Arguments
+            {
+                LearningRate = learningRate,
+                DecreaseLearningRate = decreaseLearningRate,
+                L2RegularizerWeight = l2RegularizerWeight,
+                NumIterations = numIterations,
+                LabelColumn = labelColumn,
+                FeatureColumn = featureColumn,
+                InitialWeights = weightsColumn
+
+            }, env, UserNameValue, TrainerUtils.MakeR4ScalarLabel(labelColumn))
+        {
+            LossFunction = lossFunction ?? new SquaredLoss();
         }
 
-        public OnlineGradientDescentTrainer(IHostEnvironment env, Arguments args)
-            : base(args, env, UserNameValue, TrainerUtils.MakeR4ScalarLabel(args.LabelColumn))
+        internal OnlineGradientDescentTrainer(IHostEnvironment env, Arguments args)
+        : base(args, env, UserNameValue, TrainerUtils.MakeR4ScalarLabel(args.LabelColumn))
         {
             LossFunction = args.LossFunction.CreateComponent(env);
+        }
+
+        public override PredictionKind PredictionKind => PredictionKind.Regression;
 
-            _outputColumns = new[]
+        protected override SchemaShape.Column[] GetOutputColumnsCore(SchemaShape inputSchema)
+        {
+            return new[]
             {
                 new SchemaShape.Column(DefaultColumnNames.Score, SchemaShape.Column.VectorKind.Scalar, NumberType.R4, false, new SchemaShape(MetadataUtils.GetTrainerOutputMetadata()))
             };
         }
 
-        public override PredictionKind PredictionKind => PredictionKind.Regression;
-
-        private readonly SchemaShape.Column[] _outputColumns;
-        protected override SchemaShape.Column[] GetOutputColumnsCore(SchemaShape inputSchema) => _outputColumns;
-
         protected override void CheckLabel(RoleMappedData data)
         {
             data.CheckRegressionLabel();
diff --git a/src/Microsoft.ML.StandardLearners/Standard/Online/OnlineLearnerStatic.cs b/src/Microsoft.ML.StandardLearners/Standard/Online/OnlineLearnerStatic.cs
index afa2790821..82e98f6067 100644
--- a/src/Microsoft.ML.StandardLearners/Standard/Online/OnlineLearnerStatic.cs
+++ b/src/Microsoft.ML.StandardLearners/Standard/Online/OnlineLearnerStatic.cs
@@ -40,10 +40,10 @@ public static (Scalar<float> score, Scalar<bool> predictedLabel) AveragedPercept
                 this BinaryClassificationContext.BinaryClassificationTrainers ctx,
                 IClassificationLoss lossFunction,
                 Scalar<bool> label, Vector<float> features, Scalar<float> weights = null,
-                float learningRate = AveragedLinearArguments.DefaultAveragedArgs.LearningRate,
-                bool decreaseLearningRate = AveragedLinearArguments.DefaultAveragedArgs.DecreaseLearningRate,
-                float l2RegularizerWeight = AveragedLinearArguments.DefaultAveragedArgs.L2RegularizerWeight,
-                int numIterations = OnlineLinearArguments.DefaultArgs.NumIterations,
+                float learningRate = AveragedLinearArguments.AveragedDefaultArgs.LearningRate,
+                bool decreaseLearningRate = AveragedLinearArguments.AveragedDefaultArgs.DecreaseLearningRate,
+                float l2RegularizerWeight = AveragedLinearArguments.AveragedDefaultArgs.L2RegularizerWeight,
+                int numIterations = AveragedLinearArguments.AveragedDefaultArgs.NumIterations,
                 Action<LinearBinaryPredictor> onFit = null
             )
         {
@@ -105,15 +105,13 @@ public static (Scalar<float> score, Scalar<bool> predictedLabel) AveragedPercept
         }
 
         /// <summary>
-        /// Predict a target using a linear binary classification model trained with the AveragePerceptron trainer, and a custom loss.
-        /// Note that because we cannot be sure that all loss functions will produce naturally calibrated outputs, setting
-        /// a custom loss function will not produce a calibrated probability column.
+        /// Predict a target using a linear regression model trained with the <see cref="Runtime.Learners.OnlineGradientDescentTrainer"/> trainer.
         /// </summary>
-        /// <param name="ctx">The binary classification context trainer object.</param>
+        /// <param name="ctx">The regression context trainer object.</param>
         /// <param name="label">The label, or dependent variable.</param>
         /// <param name="features">The features, or independent variables.</param>
         /// <param name="weights">The optional example weights.</param>
-        /// <param name="lossFunction">The custom loss.</param>
+        /// <param name="lossFunction">The custom loss. Defaults to <see cref="SquaredLoss"/> if not provided.</param>
         /// <param name="learningRate">The learning Rate.</param>
         /// <param name="decreaseLearningRate">Decrease learning rate as iterations progress.</param>
         /// <param name="l2RegularizerWeight">L2 Regularization Weight.</param>
@@ -125,66 +123,32 @@ public static (Scalar<float> score, Scalar<bool> predictedLabel) AveragedPercept
         /// result in any way; it is only a way for the caller to be informed about what was learnt.</param>
         /// <returns>The set of output columns including in order the predicted binary classification score (which will range
         /// from negative to positive infinity), and the predicted label.</returns>
-        /// <seealso cref="AveragedPerceptronTrainer"/>.
-        /// <returns>The set of output columns including in order the predicted per-class likelihoods (between 0 and 1, and summing up to 1), and the predicted label.</returns>
-        public static (Scalar<float> score, Scalar<float> probability, Scalar<bool> predictedLabel)
-            AveragedPerceptron(this BinaryClassificationContext.BinaryClassificationTrainers ctx,
-                Scalar<bool> label,
-                Vector<float> features,
-                IClassificationLoss lossFunction = null,
-                Scalar<float> weights = null,
-                float learningRate = AveragedLinearArguments.DefaultAveragedArgs.LearningRate,
-                bool decreaseLearningRate = AveragedLinearArguments.DefaultAveragedArgs.DecreaseLearningRate,
-                float l2RegularizerWeight = AveragedLinearArguments.DefaultAveragedArgs.L2RegularizerWeight,
-                int numIterations = OnlineLinearArguments.DefaultArgs.NumIterations,
-                Action<LinearBinaryPredictor> onFit = null)
+        /// <seealso cref="OnlineGradientDescentTrainer"/>.
+        /// <returns>The predicted output.</returns>
+        public static Scalar<float> OnlineGradientDescent(this RegressionContext.RegressionTrainers ctx,
+            Scalar<float> label,
+            Vector<float> features,
+            Scalar<float> weights = null,
+            IRegressionLoss lossFunction = null,
+            float learningRate = OnlineGradientDescentTrainer.Arguments.OgdDefaultArgs.LearningRate,
+            bool decreaseLearningRate = OnlineGradientDescentTrainer.Arguments.OgdDefaultArgs.DecreaseLearningRate,
+            float l2RegularizerWeight = OnlineGradientDescentTrainer.Arguments.OgdDefaultArgs.L2RegularizerWeight,
+            int numIterations = OnlineGradientDescentTrainer.Arguments.OgdDefaultArgs.NumIterations,
+            Action<LinearRegressionPredictor> onFit = null)
         {
-            Contracts.CheckValue(label, nameof(label));
-            Contracts.CheckValue(features, nameof(features));
-            Contracts.CheckValueOrNull(weights);
-            Contracts.CheckParam(learningRate > 0, nameof(learningRate), "Must be positive.");
-            Contracts.CheckParam(0 <= l2RegularizerWeight && l2RegularizerWeight < 0.5, nameof(l2RegularizerWeight), "must be in range [0, 0.5)");
-
-            Contracts.CheckParam(numIterations > 1, nameof(numIterations), "Must be greater than one, if specified.");
-            Contracts.CheckValueOrNull(onFit);
-
-            var args = new AveragedPerceptronTrainer.Arguments()
-            {
-                LearningRate = learningRate,
-                DecreaseLearningRate = decreaseLearningRate,
-                L2RegularizerWeight = l2RegularizerWeight,
-                NumIterations = numIterations
-            };
-
-            if (lossFunction != null)
-                args.LossFunction = new TrivialClassificationLossFactory(lossFunction);
-
-            var rec = new TrainerEstimatorReconciler.BinaryClassifier(
+            var rec = new TrainerEstimatorReconciler.Regression(
                 (env, labelName, featuresName, weightsName) =>
                 {
-                    args.FeatureColumn = featuresName;
-                    args.LabelColumn = labelName;
-                    args.InitialWeights = weightsName;
+                    var trainer = new OnlineGradientDescentTrainer(env, labelName, featuresName, learningRate,
+                        decreaseLearningRate, l2RegularizerWeight, numIterations, weightsName, lossFunction);
 
-                    var trainer = new AveragedPerceptronTrainer(env, args);
                     if (onFit != null)
-                    {
                         return trainer.WithOnFitDelegate(trans => onFit(trans.Model));
-                        /*
-                        return trainer.WithOnFitDelegate(trans =>
-                        {
-                            // Under the default log-loss we assume a calibrated predictor.
-                            var model = trans.Model;
-                            var cali = (ParameterMixingCalibratedPredictor)model;
-                            var pred = (LinearBinaryPredictor)cali.SubPredictor;
-                            onFit(pred, cali);
-                        });
-                        */
-                    }
+
                     return trainer;
                 }, label, features, weights);
 
-            return rec.Output;
+            return rec.Score;
         }
 
         private sealed class TrivialClassificationLossFactory : ISupportClassificationLossFactory
diff --git a/src/Microsoft.ML.StandardLearners/Standard/Online/OnlineLinear.cs b/src/Microsoft.ML.StandardLearners/Standard/Online/OnlineLinear.cs
index fb28bfe23a..41bf4a421a 100644
--- a/src/Microsoft.ML.StandardLearners/Standard/Online/OnlineLinear.cs
+++ b/src/Microsoft.ML.StandardLearners/Standard/Online/OnlineLinear.cs
@@ -24,7 +24,7 @@ public abstract class OnlineLinearArguments : LearnerInputBaseWithLabel
         [Argument(ArgumentType.AtMostOnce, HelpText = "Number of iterations", ShortName = "iter", SortOrder = 50)]
         [TGUI(Label = "Number of Iterations", Description = "Number of training iterations through data", SuggestedSweeps = "1,10,100")]
         [TlcModule.SweepableLongParamAttribute("NumIterations", 1, 100, stepSize: 10, isLogScale: true)]
-        public int NumIterations = DefaultArgs.NumIterations;
+        public int NumIterations = OnlineDefaultArgs.NumIterations;
 
         [Argument(ArgumentType.AtMostOnce, HelpText = "Initial Weights and bias, comma-separated", ShortName = "initweights")]
         [TGUI(NoSweep = true)]
@@ -42,7 +42,7 @@ public abstract class OnlineLinearArguments : LearnerInputBaseWithLabel
         [Argument(ArgumentType.AtMostOnce, HelpText = "Size of cache when trained in Scope", ShortName = "cache")]
         public int StreamingCacheSize = 1000000;
 
-        internal static class DefaultArgs
+        internal class OnlineDefaultArgs
         {
             internal const int NumIterations = 1;
         }
@@ -83,7 +83,7 @@ public abstract class OnlineLinearTrainer<TTransformer, TModel> : TrainerEstimat
         protected virtual bool NeedCalibration => false;
 
         protected OnlineLinearTrainer(OnlineLinearArguments args, IHostEnvironment env, string name, SchemaShape.Column label)
-            : base(Contracts.CheckRef(env, nameof(env)).Register(name), MakeFeatureColumn(args.FeatureColumn), label, MakeWeightColumn(args.InitialWeights))
+            : base(Contracts.CheckRef(env, nameof(env)).Register(name), TrainerUtils.MakeR4VecFeature(args.FeatureColumn), label, TrainerUtils.MakeR4ScalarWeightColumn(args.InitialWeights))
         {
             Contracts.CheckValue(args, nameof(args));
             Contracts.CheckUserArg(args.NumIterations > 0, nameof(args.NumIterations), UserErrorPositive);
@@ -161,18 +161,6 @@ protected override TModel TrainModelCore(TrainContext context)
 
         protected abstract void CheckLabel(RoleMappedData data);
 
-        private static SchemaShape.Column MakeWeightColumn(string weightColumn)
-        {
-            if (weightColumn == null)
-                return null;
-            return new SchemaShape.Column(weightColumn, SchemaShape.Column.VectorKind.Scalar, NumberType.R4, false);
-        }
-
-        private static SchemaShape.Column MakeFeatureColumn(string featureColumn)
-        {
-            return new SchemaShape.Column(featureColumn, SchemaShape.Column.VectorKind.Vector, NumberType.R4, false);
-        }
-
         protected virtual void TrainCore(IChannel ch, RoleMappedData data)
         {
             bool shuffle = Args.Shuffle;
diff --git a/test/Microsoft.ML.StaticPipelineTesting/Training.cs b/test/Microsoft.ML.StaticPipelineTesting/Training.cs
index 11635fe3d3..7a8540414e 100644
--- a/test/Microsoft.ML.StaticPipelineTesting/Training.cs
+++ b/test/Microsoft.ML.StaticPipelineTesting/Training.cs
@@ -186,46 +186,6 @@ public void SdcaBinaryClassificationNoCalibration()
                 Console.WriteLine($"{schema.GetColumnName(c)}, {schema.GetColumnType(c)}");
         }
 
-        [Fact]
-        public void AveragePerceptron()
-        {
-            var env = new ConsoleEnvironment(seed: 0);
-            var dataPath = GetDataPath(TestDatasets.breastCancer.trainFilename);
-            var dataSource = new MultiFileSource(dataPath);
-            var ctx = new BinaryClassificationContext(env);
-
-            var reader = TextLoader.CreateReader(env,
-                c => (label: c.LoadBool(0), features: c.LoadFloat(1, 9)));
-
-            LinearBinaryPredictor pred = null;
-            // ParameterMixingCalibratedPredictor cali = null;
-
-            var est = reader.MakeNewEstimator()
-                .Append(r => (r.label, preds: ctx.Trainers.AveragedPerceptron(r.label, r.features,
-                    numIterations: 2,
-                    onFit: (p) => { pred = p; })));
-
-            var pipe = reader.Append(est);
-
-            Assert.Null(pred);
-            //Assert.Null(cali);
-            var model = pipe.Fit(dataSource);
-            Assert.NotNull(pred);
-            //Assert.NotNull(cali);
-            // 9 input features, so we ought to have 9 weights.
-            Assert.Equal(9, pred.Weights2.Count);
-
-            var data = model.Read(dataSource);
-
-            var metrics = ctx.Evaluate(data, r => r.label, r => r.preds);
-            // Run a sanity check against a few of the metrics.
-            Assert.InRange(metrics.Accuracy, 0, 1);
-            Assert.InRange(metrics.Auc, 0, 1);
-            Assert.InRange(metrics.Auprc, 0, 1);
-            Assert.InRange(metrics.LogLoss, 0, double.PositiveInfinity);
-            Assert.InRange(metrics.Entropy, 0, double.PositiveInfinity);
-        }
-
         [Fact]
         public void AveragePerceptronNoCalibration()
         {
@@ -241,7 +201,6 @@ public void AveragePerceptronNoCalibration()
 
             var loss = new HingeLoss(new HingeLoss.Arguments() { Margin = 1 });
 
-            // With a custom loss function we no longer get calibrated predictions.
             var est = reader.MakeNewEstimator()
                 .Append(r => (r.label, preds: ctx.Trainers.AveragedPerceptron(loss, r.label, r.features,
                 numIterations: 2, onFit: p => pred = p)));
@@ -572,7 +531,7 @@ public void PoissonRegression()
         }
 
         [Fact]
-        public void LogisticRegression()
+        public void LogisticRegressionBinaryClassification()
         {
             var env = new ConsoleEnvironment(seed: 0);
             var dataPath = GetDataPath(TestDatasets.breastCancer.trainFilename);
@@ -651,5 +610,48 @@ public void MulticlassLogisticRegression()
             Assert.True(metrics.LogLoss > 0);
             Assert.True(metrics.TopKAccuracy > 0);
         }
+
+        [Fact]
+        public void OnlineGradientDescent()
+        {
+            var env = new ConsoleEnvironment(seed: 0);
+            var dataPath = GetDataPath(TestDatasets.generatedRegressionDataset.trainFilename);
+            var dataSource = new MultiFileSource(dataPath);
+
+            var ctx = new RegressionContext(env);
+
+            var reader = TextLoader.CreateReader(env,
+                c => (label: c.LoadFloat(11), features: c.LoadFloat(0, 10)),
+                separator: ';', hasHeader: true);
+
+            LinearRegressionPredictor pred = null;
+
+            var loss = new SquaredLoss();
+
+            var est = reader.MakeNewEstimator()
+                .Append(r => (r.label, score: ctx.Trainers.OnlineGradientDescent(r.label, r.features, 
+               // lossFunction:loss,
+                onFit: (p) => { pred = p; })));
+
+            var pipe = reader.Append(est);
+
+            Assert.Null(pred);
+            var model = pipe.Fit(dataSource);
+            Assert.NotNull(pred);
+            // 11 input features, so we ought to have 11 weights.
+            VBuffer<float> weights = new VBuffer<float>();
+            pred.GetFeatureWeights(ref weights);
+            Assert.Equal(11, weights.Length);
+
+            var data = model.Read(dataSource);
+
+            var metrics = ctx.Evaluate(data, r => r.label, r => r.score, new PoissonLoss());
+            // Run a sanity check against a few of the metrics.
+            Assert.InRange(metrics.L1, 0, double.PositiveInfinity);
+            Assert.InRange(metrics.L2, 0, double.PositiveInfinity);
+            Assert.InRange(metrics.Rms, 0, double.PositiveInfinity);
+            Assert.Equal(metrics.Rms * metrics.Rms, metrics.L2, 5);
+            Assert.InRange(metrics.LossFn, 0, double.PositiveInfinity);
+        }
     }
 }
diff --git a/test/Microsoft.ML.Tests/TrainerEstimators/OnlineLinearTests.cs b/test/Microsoft.ML.Tests/TrainerEstimators/OnlineLinearTests.cs
index 2dea99e131..693e3ef2c7 100644
--- a/test/Microsoft.ML.Tests/TrainerEstimators/OnlineLinearTests.cs
+++ b/test/Microsoft.ML.Tests/TrainerEstimators/OnlineLinearTests.cs
@@ -25,7 +25,7 @@ public void OnlineLinearWorkout()
 
             var trainData = pipe.Fit(data).Transform(data).AsDynamic;
 
-            IEstimator<ITransformer> est = new OnlineGradientDescentTrainer(Env, new OnlineGradientDescentTrainer.Arguments());
+            IEstimator<ITransformer> est = new OnlineGradientDescentTrainer(Env, "Label", "Features");
             TestEstimatorCore(est, trainData);
 
             est = new AveragedPerceptronTrainer(Env, new AveragedPerceptronTrainer.Arguments());

From 87530b9a8b87f0104d78e6a15c65efe6c6fe043a Mon Sep 17 00:00:00 2001
From: Senja Filipi <sefilipi@microsoft.com>
Date: Fri, 28 Sep 2018 08:52:54 -0700
Subject: [PATCH 04/10] comment, and fixing the check conditions.

---
 .../LogisticRegression/LbfgsPredictorBase.cs  | 26 ++++----
 .../LogisticRegression/LbfgsStatics.cs        | 33 +++++++---
 .../Standard/Online/OnlineLearnerStatic.cs    | 61 ++++++++-----------
 .../Training.cs                               |  6 +-
 4 files changed, 68 insertions(+), 58 deletions(-)

diff --git a/src/Microsoft.ML.StandardLearners/Standard/LogisticRegression/LbfgsPredictorBase.cs b/src/Microsoft.ML.StandardLearners/Standard/LogisticRegression/LbfgsPredictorBase.cs
index a0bedf1c11..864e0ba3ab 100644
--- a/src/Microsoft.ML.StandardLearners/Standard/LogisticRegression/LbfgsPredictorBase.cs
+++ b/src/Microsoft.ML.StandardLearners/Standard/LogisticRegression/LbfgsPredictorBase.cs
@@ -174,20 +174,20 @@ internal LbfgsTrainerBase(IHostEnvironment env, TArgs args, SchemaShape.Column l
             Host.CheckValue(args, nameof(args));
             Args = args;
 
-            Contracts.CheckUserArg(!Args.UseThreads || Args.NumThreads > 0 || Args.NumThreads == null,
+            Host.CheckUserArg(!Args.UseThreads || Args.NumThreads > 0 || Args.NumThreads == null,
                 nameof(Args.NumThreads), "numThreads must be positive (or empty for default)");
-            Contracts.CheckUserArg(Args.L2Weight >= 0, nameof(Args.L2Weight), "Must be non-negative");
-            Contracts.CheckUserArg(Args.L1Weight >= 0, nameof(Args.L1Weight), "Must be non-negative");
-            Contracts.CheckUserArg(Args.OptTol > 0, nameof(Args.OptTol), "Must be positive");
-            Contracts.CheckUserArg(Args.MemorySize > 0, nameof(Args.MemorySize), "Must be positive");
-            Contracts.CheckUserArg(Args.MaxIterations > 0, nameof(Args.MaxIterations), "Must be positive");
-            Contracts.CheckUserArg(Args.SgdInitializationTolerance >= 0, nameof(Args.SgdInitializationTolerance), "Must be non-negative");
-            Contracts.CheckUserArg(Args.NumThreads == null || Args.NumThreads.Value >= 0, nameof(Args.NumThreads), "Must be non-negative");
-
-            Contracts.CheckParam(l2Weight >= 0, nameof(l2Weight), "Must be non-negative, if provided.");
-            Contracts.CheckParam(l1Weight >= 0, nameof(l1Weight), "Must be non-negative, if provided");
-            Contracts.CheckParam(optimizationTolerance > 0, nameof(optimizationTolerance), "Must be positive, if provided.");
-            Contracts.CheckParam(memorySize > 0, nameof(memorySize), "Must be positive, if provided.");
+            Host.CheckUserArg(Args.L2Weight >= 0, nameof(Args.L2Weight), "Must be non-negative");
+            Host.CheckUserArg(Args.L1Weight >= 0, nameof(Args.L1Weight), "Must be non-negative");
+            Host.CheckUserArg(Args.OptTol > 0, nameof(Args.OptTol), "Must be positive");
+            Host.CheckUserArg(Args.MemorySize > 0, nameof(Args.MemorySize), "Must be positive");
+            Host.CheckUserArg(Args.MaxIterations > 0, nameof(Args.MaxIterations), "Must be positive");
+            Host.CheckUserArg(Args.SgdInitializationTolerance >= 0, nameof(Args.SgdInitializationTolerance), "Must be non-negative");
+            Host.CheckUserArg(Args.NumThreads == null || Args.NumThreads.Value >= 0, nameof(Args.NumThreads), "Must be non-negative");
+
+            Host.CheckParam(!(l2Weight < 0), nameof(l2Weight), "Must be non-negative, if provided.");
+            Host.CheckParam(!(l1Weight < 0), nameof(l1Weight), "Must be non-negative, if provided");
+            Host.CheckParam(!(optimizationTolerance <= 0), nameof(optimizationTolerance), "Must be positive, if provided.");
+            Host.CheckParam(!(memorySize <= 0), nameof(memorySize), "Must be positive, if provided.");
 
             // Review: Warn about the overriding behavior
             L2Weight = l2Weight ?? Args.L2Weight;
diff --git a/src/Microsoft.ML.StandardLearners/Standard/LogisticRegression/LbfgsStatics.cs b/src/Microsoft.ML.StandardLearners/Standard/LogisticRegression/LbfgsStatics.cs
index 020a759159..542381f3c1 100644
--- a/src/Microsoft.ML.StandardLearners/Standard/LogisticRegression/LbfgsStatics.cs
+++ b/src/Microsoft.ML.StandardLearners/Standard/LogisticRegression/LbfgsStatics.cs
@@ -14,10 +14,11 @@
 namespace Microsoft.ML.Trainers
 {
     using Arguments = LogisticRegression.Arguments;
+
     /// <summary>
-    /// Extension methods and utilities for instantiating LogisticRegression trainer estimators inside statically typed pipelines.
+    /// Binary Classification trainer estimators.
     /// </summary>
-    public static class LogisticRegressionStatics
+    public static partial class BinaryClassificationTrainers
     {
         /// <summary>
         ///  Predict a target using a linear binary classification model trained with the <see cref="Runtime.Learners.LogisticRegression"/> trainer.
@@ -37,7 +38,7 @@ public static class LogisticRegressionStatics
         /// the linear model that was trained.  Note that this action cannot change the result in any way; it is only a way for the caller to
         /// be informed about what was learnt.</param>
         /// <returns>The predicted output.</returns>
-        public static (Scalar<float> score, Scalar<float> probability, Scalar<bool> predictedLabel) LogisticRegression(this BinaryClassificationContext.BinaryClassificationTrainers ctx,
+        public static (Scalar<float> score, Scalar<float> probability, Scalar<bool> predictedLabel) LogisticRegressionBinaryClassifier(this BinaryClassificationContext.BinaryClassificationTrainers ctx,
             Scalar<bool> label,
             Vector<float> features,
             Scalar<float> weights = null,
@@ -48,7 +49,7 @@ public static (Scalar<float> score, Scalar<float> probability, Scalar<bool> pred
             bool enoforceNoNegativity = Arguments.Defaults.EnforceNonNegativity,
             Action<ParameterMixingCalibratedPredictor> onFit = null)
         {
-            ValidateParams(label, features, weights, l1Weight, l2Weight, optimizationTolerance, memorySize, enoforceNoNegativity, onFit);
+            LbfgsStaticsUtils.ValidateParams(label, features, weights, l1Weight, l2Weight, optimizationTolerance, memorySize, enoforceNoNegativity, onFit);
 
             var rec = new TrainerEstimatorReconciler.BinaryClassifier(
                 (env, labelName, featuresName, weightsName) =>
@@ -64,6 +65,13 @@ public static (Scalar<float> score, Scalar<float> probability, Scalar<bool> pred
 
             return rec.Output;
         }
+    }
+
+    /// <summary>
+    /// Regression trainer estimators.
+    /// </summary>
+    public static partial class RegressionTrainers
+    {
 
         /// <summary>
         /// Predict a target using a linear regression model trained with the <see cref="Runtime.Learners.LogisticRegression"/> trainer.
@@ -94,7 +102,7 @@ public static Scalar<float> PoissonRegression(this RegressionContext.RegressionT
             bool enoforceNoNegativity = Arguments.Defaults.EnforceNonNegativity,
             Action<PoissonRegressionPredictor> onFit = null)
         {
-            ValidateParams(label, features, weights, l1Weight, l2Weight, optimizationTolerance, memorySize, enoforceNoNegativity, onFit);
+            LbfgsStaticsUtils.ValidateParams(label, features, weights, l1Weight, l2Weight, optimizationTolerance, memorySize, enoforceNoNegativity, onFit);
 
             var rec = new TrainerEstimatorReconciler.Regression(
                 (env, labelName, featuresName, weightsName) =>
@@ -110,6 +118,13 @@ public static Scalar<float> PoissonRegression(this RegressionContext.RegressionT
 
             return rec.Score;
         }
+    }
+
+    /// <summary>
+    /// MultiClass Classification trainer estimators.
+    /// </summary>
+    public static partial class MultiClassClassificationTrainers
+    {
 
         /// <summary>
         /// Predict a target using a linear multiclass classification model trained with the <see cref="Runtime.Learners.MulticlassLogisticRegression"/> trainer.
@@ -141,7 +156,7 @@ public static (Vector<float> score, Key<uint, TVal> predictedLabel)
             bool enoforceNoNegativity = Arguments.Defaults.EnforceNonNegativity,
             Action<MulticlassLogisticRegressionPredictor> onFit = null)
         {
-            ValidateParams(label, features, weights, l1Weight, l2Weight, optimizationTolerance, memorySize, enoforceNoNegativity, onFit);
+            LbfgsStaticsUtils.ValidateParams(label, features, weights, l1Weight, l2Weight, optimizationTolerance, memorySize, enoforceNoNegativity, onFit);
 
             var rec = new TrainerEstimatorReconciler.MulticlassClassifier<TVal>(
                 (env, labelName, featuresName, weightsName) =>
@@ -157,7 +172,11 @@ public static (Vector<float> score, Key<uint, TVal> predictedLabel)
             return rec.Output;
         }
 
-        private static void ValidateParams(PipelineColumn label,
+    }
+
+    internal sealed class LbfgsStaticsUtils{
+
+        internal static void ValidateParams(PipelineColumn label,
             Vector<float> features,
             Scalar<float> weights = null,
             float l1Weight = Arguments.Defaults.L1Weight,
diff --git a/src/Microsoft.ML.StandardLearners/Standard/Online/OnlineLearnerStatic.cs b/src/Microsoft.ML.StandardLearners/Standard/Online/OnlineLearnerStatic.cs
index 82e98f6067..cb816107f5 100644
--- a/src/Microsoft.ML.StandardLearners/Standard/Online/OnlineLearnerStatic.cs
+++ b/src/Microsoft.ML.StandardLearners/Standard/Online/OnlineLearnerStatic.cs
@@ -4,7 +4,6 @@
 
 using Microsoft.ML.Runtime;
 using Microsoft.ML.Runtime.Data;
-using Microsoft.ML.Runtime.Internal.Calibration;
 using Microsoft.ML.Runtime.Learners;
 using Microsoft.ML.StaticPipe;
 using Microsoft.ML.StaticPipe.Runtime;
@@ -12,12 +11,13 @@
 
 namespace Microsoft.ML.Trainers
 {
-    public static class OnlineLearnerStatic
+    /// <summary>
+    /// Binary Classification trainer estimators.
+    /// </summary>
+    public static partial class BinaryClassificationTrainers
     {
         /// <summary>
-        /// Predict a target using a linear binary classification model trained with the SDCA trainer, and a custom loss.
-        /// Note that because we cannot be sure that all loss functions will produce naturally calibrated outputs, setting
-        /// a custom loss function will not produce a calibrated probability column.
+        /// Predict a target using a linear binary classification model trained with the AveragedPerceptron trainer, and a custom loss.
         /// </summary>
         /// <param name="ctx">The binary classification context trainer object.</param>
         /// <param name="label">The label, or dependent variable.</param>
@@ -84,26 +84,32 @@ public static (Scalar<float> score, Scalar<bool> predictedLabel) AveragedPercept
                     else
                         return trainer;
 
-                    /*
-                    if (onFit != null)
-                    {
-                        return trainer.WithOnFitDelegate(trans =>
-                        {
-                            var model = trans.Model;
-                            if (model is ParameterMixingCalibratedPredictor cali)
-                                onFit((LinearBinaryPredictor)cali.SubPredictor);
-                            else
-                                onFit((LinearBinaryPredictor)model);
-                        });
-                    }
-                    return trainer;
-                    */
-
                 }, label, features, weights, hasProbs);
 
             return rec.Output;
         }
 
+        private sealed class TrivialClassificationLossFactory : ISupportClassificationLossFactory
+        {
+            private readonly IClassificationLoss _loss; // loss instance captured at construction time
+
+            public TrivialClassificationLossFactory(IClassificationLoss loss)
+            {
+                _loss = loss;
+            }
+
+            public IClassificationLoss CreateComponent(IHostEnvironment env)
+            {
+                return _loss; // env is not consulted; the stored instance is returned on every call
+            }
+        }
+    }
+
+    /// <summary>
+    /// Regression trainer estimators.
+    /// </summary>
+    public static partial class RegressionTrainers
+    {
         /// <summary>
         /// Predict a target using a linear regression model trained with the <see cref="Runtime.Learners.OnlineGradientDescentTrainer"/> trainer.
         /// </summary>
@@ -150,20 +156,5 @@ public static Scalar<float> OnlineGradientDescent(this RegressionContext.Regress
 
             return rec.Score;
         }
-
-        private sealed class TrivialClassificationLossFactory : ISupportClassificationLossFactory
-        {
-            private readonly IClassificationLoss _loss;
-
-            public TrivialClassificationLossFactory(IClassificationLoss loss)
-            {
-                _loss = loss;
-            }
-
-            public IClassificationLoss CreateComponent(IHostEnvironment env)
-            {
-                return _loss;
-            }
-        }
     }
 }
diff --git a/test/Microsoft.ML.StaticPipelineTesting/Training.cs b/test/Microsoft.ML.StaticPipelineTesting/Training.cs
index 7a8540414e..96665fd6ab 100644
--- a/test/Microsoft.ML.StaticPipelineTesting/Training.cs
+++ b/test/Microsoft.ML.StaticPipelineTesting/Training.cs
@@ -160,9 +160,9 @@ public void SdcaBinaryClassificationNoCalibration()
 
             // With a custom loss function we no longer get calibrated predictions.
             var est = reader.MakeNewEstimator()
-                .Append(r => (r.label, preds: ctx.Trainers.AveragedPerceptron(loss, r.label, r.features,
-                numIterations: 2,
-                onFit: p => pred = p)));
+                .Append(r => (r.label, preds: ctx.Trainers.Sdca(r.label, r.features,
+                maxIterations: 2,
+                loss: loss, onFit: p => pred = p)));
 
             var pipe = reader.Append(est);
 

From 2b58625257baa19556ce349a6bb7bc3cc600443b Mon Sep 17 00:00:00 2001
From: Senja Filipi <sefilipi@microsoft.com>
Date: Fri, 28 Sep 2018 10:26:35 -0700
Subject: [PATCH 05/10] namespace change for pigstensions

---
 Microsoft.ML.sln                              |  2 +-
 .../LogisticRegression/LbfgsStatics.cs        | 24 +++++++++----------
 .../Standard/Online/OnlineLearnerStatic.cs    |  5 ++--
 .../Training.cs                               |  4 ++--
 4 files changed, 16 insertions(+), 19 deletions(-)

diff --git a/Microsoft.ML.sln b/Microsoft.ML.sln
index d6dd898ee3..56c4664666 100644
--- a/Microsoft.ML.sln
+++ b/Microsoft.ML.sln
@@ -119,7 +119,7 @@ Project("{9A19103F-16F7-4668-BE54-9A1E7A4F7556}") = "Microsoft.ML.OnnxTransform"
 EndProject
 Project("{9A19103F-16F7-4668-BE54-9A1E7A4F7556}") = "Microsoft.ML.DnnAnalyzer", "src\Microsoft.ML.DnnAnalyzer\Microsoft.ML.DnnAnalyzer\Microsoft.ML.DnnAnalyzer.csproj", "{73DAAC82-D308-48CC-8FFE-3B037F8BBCCA}"
 EndProject
-Project("{FAE04EC0-301F-11D3-BF4B-00C04F79EFBC}") = "Microsoft.ML.OnnxTransformTest", "test\Microsoft.ML.OnnxTransformTest\Microsoft.ML.OnnxTransformTest.csproj", "{49D03292-8AFE-4B82-823C-D047BF8420F7}"
+Project("{9A19103F-16F7-4668-BE54-9A1E7A4F7556}") = "Microsoft.ML.OnnxTransformTest", "test\Microsoft.ML.OnnxTransformTest\Microsoft.ML.OnnxTransformTest.csproj", "{49D03292-8AFE-4B82-823C-D047BF8420F7}"
 EndProject
 Global
 	GlobalSection(SolutionConfigurationPlatforms) = preSolution
diff --git a/src/Microsoft.ML.StandardLearners/Standard/LogisticRegression/LbfgsStatics.cs b/src/Microsoft.ML.StandardLearners/Standard/LogisticRegression/LbfgsStatics.cs
index 542381f3c1..a21f2568cb 100644
--- a/src/Microsoft.ML.StandardLearners/Standard/LogisticRegression/LbfgsStatics.cs
+++ b/src/Microsoft.ML.StandardLearners/Standard/LogisticRegression/LbfgsStatics.cs
@@ -7,11 +7,9 @@
 using Microsoft.ML.Runtime.Data;
 using Microsoft.ML.Runtime.Internal.Calibration;
 using Microsoft.ML.Runtime.Learners;
-using Microsoft.ML.Runtime.Training;
-using Microsoft.ML.StaticPipe;
 using Microsoft.ML.StaticPipe.Runtime;
 
-namespace Microsoft.ML.Trainers
+namespace Microsoft.ML.StaticPipe
 {
     using Arguments = LogisticRegression.Arguments;
 
@@ -21,7 +19,7 @@ namespace Microsoft.ML.Trainers
     public static partial class BinaryClassificationTrainers
     {
         /// <summary>
-        ///  Predict a target using a linear binary classification model trained with the <see cref="Runtime.Learners.LogisticRegression"/> trainer.
+        ///  Predict a target using a linear binary classification model trained with the <see cref="Microsoft.ML.Runtime.Learners.LogisticRegression"/> trainer.
         /// </summary>
         /// <param name="ctx">The binary classificaiton context trainer object.</param>
         /// <param name="label">The label, or dependent variable.</param>
@@ -30,7 +28,7 @@ public static partial class BinaryClassificationTrainers
         /// <param name="enoforceNoNegativity">Enforce non-negative weights.</param>
         /// <param name="l1Weight">Weight of L1 regularizer term.</param>
         /// <param name="l2Weight">Weight of L2 regularizer term.</param>
-        /// <param name="memorySize">Memory size for <see cref="Runtime.Learners.LogisticRegression"/>. Lower=faster, less accurate.</param>
+        /// <param name="memorySize">Memory size for <see cref="Microsoft.ML.Runtime.Learners.LogisticRegression"/>. Lower=faster, less accurate.</param>
         /// <param name="optimizationTolerance">Threshold for optimizer convergence.</param>
         /// <param name="onFit">A delegate that is called every time the
         /// <see cref="Estimator{TTupleInShape, TTupleOutShape, TTransformer}.Fit(DataView{TTupleInShape})"/> method is called on the
@@ -49,7 +47,7 @@ public static (Scalar<float> score, Scalar<float> probability, Scalar<bool> pred
             bool enoforceNoNegativity = Arguments.Defaults.EnforceNonNegativity,
             Action<ParameterMixingCalibratedPredictor> onFit = null)
         {
-            LbfgsStaticsUtils.ValidateParams(label, features, weights, l1Weight, l2Weight, optimizationTolerance, memorySize, enoforceNoNegativity, onFit);
+            LbfgsStaticUtils.ValidateParams(label, features, weights, l1Weight, l2Weight, optimizationTolerance, memorySize, enoforceNoNegativity, onFit);
 
             var rec = new TrainerEstimatorReconciler.BinaryClassifier(
                 (env, labelName, featuresName, weightsName) =>
@@ -74,7 +72,7 @@ public static partial class RegressionTrainers
     {
 
         /// <summary>
-        /// Predict a target using a linear regression model trained with the <see cref="Runtime.Learners.LogisticRegression"/> trainer.
+        /// Predict a target using a linear regression model trained with the <see cref="Microsoft.ML.Runtime.Learners.PoissonRegression"/> trainer.
         /// </summary>
         /// <param name="ctx">The regression context trainer object.</param>
         /// <param name="label">The label, or dependent variable.</param>
@@ -83,7 +81,7 @@ public static partial class RegressionTrainers
         /// <param name="enoforceNoNegativity">Enforce non-negative weights.</param>
         /// <param name="l1Weight">Weight of L1 regularizer term.</param>
         /// <param name="l2Weight">Weight of L2 regularizer term.</param>
-        /// <param name="memorySize">Memory size for <see cref="Runtime.Learners.LogisticRegression"/>. Lower=faster, less accurate.</param>
+        /// <param name="memorySize">Memory size for <see cref="Microsoft.ML.Runtime.Learners.LogisticRegression"/>. Lower=faster, less accurate.</param>
         /// <param name="optimizationTolerance">Threshold for optimizer convergence.</param>
         /// <param name="onFit">A delegate that is called every time the
         /// <see cref="Estimator{TTupleInShape, TTupleOutShape, TTransformer}.Fit(DataView{TTupleInShape})"/> method is called on the
@@ -102,7 +100,7 @@ public static Scalar<float> PoissonRegression(this RegressionContext.RegressionT
             bool enoforceNoNegativity = Arguments.Defaults.EnforceNonNegativity,
             Action<PoissonRegressionPredictor> onFit = null)
         {
-            LbfgsStaticsUtils.ValidateParams(label, features, weights, l1Weight, l2Weight, optimizationTolerance, memorySize, enoforceNoNegativity, onFit);
+            LbfgsStaticUtils.ValidateParams(label, features, weights, l1Weight, l2Weight, optimizationTolerance, memorySize, enoforceNoNegativity, onFit);
 
             var rec = new TrainerEstimatorReconciler.Regression(
                 (env, labelName, featuresName, weightsName) =>
@@ -127,7 +125,7 @@ public static partial class MultiClassClassificationTrainers
     {
 
         /// <summary>
-        /// Predict a target using a linear multiclass classification model trained with the <see cref="Runtime.Learners.MulticlassLogisticRegression"/> trainer.
+        /// Predict a target using a linear multiclass classification model trained with the <see cref="Microsoft.ML.Runtime.Learners.MulticlassLogisticRegression"/> trainer.
         /// </summary>
         /// <param name="ctx">The multiclass classification context trainer object.</param>
         /// <param name="label">The label, or dependent variable.</param>
@@ -136,7 +134,7 @@ public static partial class MultiClassClassificationTrainers
         /// <param name="enoforceNoNegativity">Enforce non-negative weights.</param>
         /// <param name="l1Weight">Weight of L1 regularizer term.</param>
         /// <param name="l2Weight">Weight of L2 regularizer term.</param>
-        /// <param name="memorySize">Memory size for <see cref="Runtime.Learners.LogisticRegression"/>. Lower=faster, less accurate.</param>
+        /// <param name="memorySize">Memory size for <see cref="Microsoft.ML.Runtime.Learners.LogisticRegression"/>. Lower=faster, less accurate.</param>
         /// <param name="optimizationTolerance">Threshold for optimizer convergence.</param>
         /// <param name="onFit">A delegate that is called every time the
         /// <see cref="Estimator{TTupleInShape, TTupleOutShape, TTransformer}.Fit(DataView{TTupleInShape})"/> method is called on the
@@ -156,7 +154,7 @@ public static (Vector<float> score, Key<uint, TVal> predictedLabel)
             bool enoforceNoNegativity = Arguments.Defaults.EnforceNonNegativity,
             Action<MulticlassLogisticRegressionPredictor> onFit = null)
         {
-            LbfgsStaticsUtils.ValidateParams(label, features, weights, l1Weight, l2Weight, optimizationTolerance, memorySize, enoforceNoNegativity, onFit);
+            LbfgsStaticUtils.ValidateParams(label, features, weights, l1Weight, l2Weight, optimizationTolerance, memorySize, enoforceNoNegativity, onFit);
 
             var rec = new TrainerEstimatorReconciler.MulticlassClassifier<TVal>(
                 (env, labelName, featuresName, weightsName) =>
@@ -174,7 +172,7 @@ public static (Vector<float> score, Key<uint, TVal> predictedLabel)
 
     }
 
-    internal sealed class LbfgsStaticsUtils{
+    internal static class LbfgsStaticUtils{
 
         internal static void ValidateParams(PipelineColumn label,
             Vector<float> features,
diff --git a/src/Microsoft.ML.StandardLearners/Standard/Online/OnlineLearnerStatic.cs b/src/Microsoft.ML.StandardLearners/Standard/Online/OnlineLearnerStatic.cs
index cb816107f5..ba2087a6ff 100644
--- a/src/Microsoft.ML.StandardLearners/Standard/Online/OnlineLearnerStatic.cs
+++ b/src/Microsoft.ML.StandardLearners/Standard/Online/OnlineLearnerStatic.cs
@@ -5,11 +5,10 @@
 using Microsoft.ML.Runtime;
 using Microsoft.ML.Runtime.Data;
 using Microsoft.ML.Runtime.Learners;
-using Microsoft.ML.StaticPipe;
 using Microsoft.ML.StaticPipe.Runtime;
 using System;
 
-namespace Microsoft.ML.Trainers
+namespace Microsoft.ML.StaticPipe
 {
     /// <summary>
     /// Binary Classification trainer estimators.
@@ -111,7 +110,7 @@ public IClassificationLoss CreateComponent(IHostEnvironment env)
     public static partial class RegressionTrainers
     {
         /// <summary>
-        /// Predict a target using a linear regression model trained with the <see cref="Runtime.Learners.OnlineGradientDescentTrainer"/> trainer.
+        /// Predict a target using a linear regression model trained with the <see cref="Microsoft.ML.Runtime.Learners.OnlineGradientDescentTrainer"/> trainer.
         /// </summary>
         /// <param name="ctx">The regression context trainer object.</param>
         /// <param name="label">The label, or dependent variable.</param>
diff --git a/test/Microsoft.ML.StaticPipelineTesting/Training.cs b/test/Microsoft.ML.StaticPipelineTesting/Training.cs
index 96665fd6ab..dbca9b7fa4 100644
--- a/test/Microsoft.ML.StaticPipelineTesting/Training.cs
+++ b/test/Microsoft.ML.StaticPipelineTesting/Training.cs
@@ -11,7 +11,7 @@
 using Microsoft.ML.Runtime.Learners;
 using Microsoft.ML.Runtime.LightGBM;
 using Microsoft.ML.Runtime.RunTests;
-using Microsoft.ML.Runtime.Training;
+using Microsoft.ML.StaticPipe;
 using Microsoft.ML.Trainers;
 using System;
 using System.Linq;
@@ -544,7 +544,7 @@ public void LogisticRegressionBinaryClassification()
             IPredictorWithFeatureWeights<float> pred = null;
 
             var est = reader.MakeNewEstimator()
-                .Append(r => (r.label, preds: ctx.Trainers.LogisticRegression(r.label, r.features,
+                .Append(r => (r.label, preds: ctx.Trainers.LogisticRegressionBinaryClassifier(r.label, r.features,
                     l1Weight: 10,
                     onFit: (p) => { pred = p; })));
 

From 03c1cdc812fcb367f83307e2e87d97098a673971 Mon Sep 17 00:00:00 2001
From: Senja Filipi <sefilipi@microsoft.com>
Date: Fri, 28 Sep 2018 10:49:04 -0700
Subject: [PATCH 06/10] namespace change, more checks on user params

---
 .../KMeansStatic.cs                           | 28 +++++++++-------
 .../Standard/Online/OnlineLearnerStatic.cs    | 33 ++++++++++++++-----
 2 files changed, 41 insertions(+), 20 deletions(-)

diff --git a/src/Microsoft.ML.KMeansClustering/KMeansStatic.cs b/src/Microsoft.ML.KMeansClustering/KMeansStatic.cs
index 2a64ef8d31..d75ddddd74 100644
--- a/src/Microsoft.ML.KMeansClustering/KMeansStatic.cs
+++ b/src/Microsoft.ML.KMeansClustering/KMeansStatic.cs
@@ -2,13 +2,13 @@
 // The .NET Foundation licenses this file to you under the MIT license.
 // See the LICENSE file in the project root for more information.
 
+using Microsoft.ML.Runtime;
 using Microsoft.ML.Runtime.Data;
 using Microsoft.ML.Runtime.KMeans;
-using Microsoft.ML.StaticPipe;
 using Microsoft.ML.StaticPipe.Runtime;
 using System;
 
-namespace Microsoft.ML.Trainers
+namespace Microsoft.ML.StaticPipe
 {
     /// <summary>
     /// The trainer context extensions for the <see cref="KMeansPlusPlusTrainer"/>.
@@ -35,16 +35,22 @@ public static (Vector<float> score, Key<uint> predictedLabel) KMeans(this Cluste
            Action<KMeansPlusPlusTrainer.Arguments> advancedSettings = null,
            Action<KMeansPredictor> onFit = null)
         {
-               var rec = new TrainerEstimatorReconciler.Clustering(
-               (env, featuresName, weightsName) =>
-               {
-                   var trainer = new KMeansPlusPlusTrainer(env, featuresName, clustersCount, weightsName, advancedSettings);
+            Contracts.CheckValue(features, nameof(features));
+            Contracts.CheckValueOrNull(weights);
+            Contracts.CheckParam(clustersCount > 1, nameof(clustersCount), "If provided, must be greater than 1.");
+            Contracts.CheckValueOrNull(onFit);
+            Contracts.CheckValueOrNull(advancedSettings);
 
-                   if (onFit != null)
-                       return trainer.WithOnFitDelegate(trans => onFit(trans.Model));
-                   else
-                       return trainer;
-               }, features, weights);
+            var rec = new TrainerEstimatorReconciler.Clustering(
+            (env, featuresName, weightsName) =>
+            {
+                var trainer = new KMeansPlusPlusTrainer(env, featuresName, clustersCount, weightsName, advancedSettings);
+
+                if (onFit != null)
+                    return trainer.WithOnFitDelegate(trans => onFit(trans.Model));
+                else
+                    return trainer;
+            }, features, weights);
 
             return rec.Output;
         }
diff --git a/src/Microsoft.ML.StandardLearners/Standard/Online/OnlineLearnerStatic.cs b/src/Microsoft.ML.StandardLearners/Standard/Online/OnlineLearnerStatic.cs
index ba2087a6ff..03637bb1b0 100644
--- a/src/Microsoft.ML.StandardLearners/Standard/Online/OnlineLearnerStatic.cs
+++ b/src/Microsoft.ML.StandardLearners/Standard/Online/OnlineLearnerStatic.cs
@@ -46,15 +46,7 @@ public static (Scalar<float> score, Scalar<bool> predictedLabel) AveragedPercept
                 Action<LinearBinaryPredictor> onFit = null
             )
         {
-            Contracts.CheckValue(label, nameof(label));
-            Contracts.CheckValue(features, nameof(features));
-            Contracts.CheckValue(lossFunction, nameof(lossFunction));
-            Contracts.CheckValueOrNull(weights);
-            Contracts.CheckParam(learningRate > 0, nameof(learningRate), "Must be positive.");
-            Contracts.CheckParam(0 <= l2RegularizerWeight && l2RegularizerWeight < 0.5, nameof(l2RegularizerWeight), "must be in range [0, 0.5)");
-
-            Contracts.CheckParam(numIterations > 1, nameof(numIterations), "Must be greater than one, if specified.");
-            Contracts.CheckValueOrNull(onFit);
+            OnlineLinearStaticUtils.CheckUserParams(label, features, weights, learningRate, l2RegularizerWeight, numIterations, onFit);
 
             bool hasProbs = lossFunction is HingeLoss;
 
@@ -141,6 +133,9 @@ public static Scalar<float> OnlineGradientDescent(this RegressionContext.Regress
             int numIterations = OnlineGradientDescentTrainer.Arguments.OgdDefaultArgs.NumIterations,
             Action<LinearRegressionPredictor> onFit = null)
         {
+            OnlineLinearStaticUtils.CheckUserParams(label, features, weights, learningRate, l2RegularizerWeight, numIterations, onFit);
+            Contracts.CheckValueOrNull(lossFunction);
+
             var rec = new TrainerEstimatorReconciler.Regression(
                 (env, labelName, featuresName, weightsName) =>
                 {
@@ -156,4 +151,24 @@ public static Scalar<float> OnlineGradientDescent(this RegressionContext.Regress
             return rec.Score;
         }
     }
+
+    internal static class OnlineLinearStaticUtils{
+        /// <summary>Runs the <see cref="Contracts"/> checks shared by the online linear static trainer extensions on the user-supplied arguments.</summary>
+        internal static void CheckUserParams(PipelineColumn label,
+            PipelineColumn features,
+            PipelineColumn weights,
+            float learningRate,
+            float l2RegularizerWeight,
+            int numIterations,
+            Delegate onFit)
+        {
+            Contracts.CheckValue(label, nameof(label));
+            Contracts.CheckValue(features, nameof(features));
+            Contracts.CheckValueOrNull(weights);
+            Contracts.CheckParam(learningRate > 0, nameof(learningRate), "Must be positive.");
+            Contracts.CheckParam(0 <= l2RegularizerWeight && l2RegularizerWeight < 0.5, nameof(l2RegularizerWeight), "must be in range [0, 0.5)");
+            Contracts.CheckParam(numIterations > 1, nameof(numIterations), "Must be greater than one, if specified."); // NOTE(review): rejects a single pass (numIterations == 1) - confirm the callers' default value satisfies this
+            Contracts.CheckValueOrNull(onFit);
+        }
+    }
 }

From dabf5915fc85f4588937764905438552344f16ea Mon Sep 17 00:00:00 2001
From: Senja Filipi <sefilipi@microsoft.com>
Date: Fri, 28 Sep 2018 10:50:49 -0700
Subject: [PATCH 07/10] casing and help sentences nit

---
 .../Standard/LogisticRegression/LbfgsStatics.cs      | 12 ++++++------
 .../Standard/Online/OnlineLearnerStatic.cs           |  4 ++--
 2 files changed, 8 insertions(+), 8 deletions(-)

diff --git a/src/Microsoft.ML.StandardLearners/Standard/LogisticRegression/LbfgsStatics.cs b/src/Microsoft.ML.StandardLearners/Standard/LogisticRegression/LbfgsStatics.cs
index a21f2568cb..71227d2155 100644
--- a/src/Microsoft.ML.StandardLearners/Standard/LogisticRegression/LbfgsStatics.cs
+++ b/src/Microsoft.ML.StandardLearners/Standard/LogisticRegression/LbfgsStatics.cs
@@ -26,8 +26,8 @@ public static partial class BinaryClassificationTrainers
         /// <param name="features">The features, or independent variables.</param>
         /// <param name="weights">The optional example weights.</param>
         /// <param name="enoforceNoNegativity">Enforce non-negative weights.</param>
-        /// <param name="l1Weight">Weight of L1 regularizer term.</param>
-        /// <param name="l2Weight">Weight of L2 regularizer term.</param>
+        /// <param name="l1Weight">Weight of L1 regularization term.</param>
+        /// <param name="l2Weight">Weight of L2 regularization term.</param>
         /// <param name="memorySize">Memory size for <see cref="Microsoft.ML.Runtime.Learners.LogisticRegression"/>. Lower=faster, less accurate.</param>
         /// <param name="optimizationTolerance">Threshold for optimizer convergence.</param>
         /// <param name="onFit">A delegate that is called every time the
@@ -79,8 +79,8 @@ public static partial class RegressionTrainers
         /// <param name="features">The features, or independent variables.</param>
         /// <param name="weights">The optional example weights.</param>
         /// <param name="enoforceNoNegativity">Enforce non-negative weights.</param>
-        /// <param name="l1Weight">Weight of L1 regularizer term.</param>
-        /// <param name="l2Weight">Weight of L2 regularizer term.</param>
+        /// <param name="l1Weight">Weight of L1 regularization term.</param>
+        /// <param name="l2Weight">Weight of L2 regularization term.</param>
         /// <param name="memorySize">Memory size for <see cref="Microsoft.ML.Runtime.Learners.LogisticRegression"/>. Lower=faster, less accurate.</param>
         /// <param name="optimizationTolerance">Threshold for optimizer convergence.</param>
         /// <param name="onFit">A delegate that is called every time the
@@ -132,8 +132,8 @@ public static partial class MultiClassClassificationTrainers
         /// <param name="features">The features, or independent variables.</param>
         /// <param name="weights">The optional example weights.</param>
         /// <param name="enoforceNoNegativity">Enforce non-negative weights.</param>
-        /// <param name="l1Weight">Weight of L1 regularizer term.</param>
-        /// <param name="l2Weight">Weight of L2 regularizer term.</param>
+        /// <param name="l1Weight">Weight of L1 regularization term.</param>
+        /// <param name="l2Weight">Weight of L2 regularization term.</param>
         /// <param name="memorySize">Memory size for <see cref="Microsoft.ML.Runtime.Learners.LogisticRegression"/>. Lower=faster, less accurate.</param>
         /// <param name="optimizationTolerance">Threshold for optimizer convergence.</param>
         /// <param name="onFit">A delegate that is called every time the
diff --git a/src/Microsoft.ML.StandardLearners/Standard/Online/OnlineLearnerStatic.cs b/src/Microsoft.ML.StandardLearners/Standard/Online/OnlineLearnerStatic.cs
index 03637bb1b0..1998dd0607 100644
--- a/src/Microsoft.ML.StandardLearners/Standard/Online/OnlineLearnerStatic.cs
+++ b/src/Microsoft.ML.StandardLearners/Standard/Online/OnlineLearnerStatic.cs
@@ -25,7 +25,7 @@ public static partial class BinaryClassificationTrainers
         /// <param name="weights">The optional example weights.</param>
         /// <param name="learningRate">The learning Rate.</param>
         /// <param name="decreaseLearningRate">Decrease learning rate as iterations progress.</param>
-        /// <param name="l2RegularizerWeight">L2 Regularization Weight.</param>
+        /// <param name="l2RegularizerWeight">L2 regularization weight.</param>
         /// <param name="numIterations">Number of training iterations through the data.</param>
         /// <param name="onFit">A delegate that is called every time the
         /// <see cref="Estimator{TTupleInShape, TTupleOutShape, TTransformer}.Fit(DataView{TTupleInShape})"/> method is called on the
@@ -111,7 +111,7 @@ public static partial class RegressionTrainers
         /// <param name="lossFunction">The custom loss. Defaults to <see cref="SquaredLoss"/> if not provided.</param>
         /// <param name="learningRate">The learning Rate.</param>
         /// <param name="decreaseLearningRate">Decrease learning rate as iterations progress.</param>
-        /// <param name="l2RegularizerWeight">L2 Regularization Weight.</param>
+        /// <param name="l2RegularizerWeight">L2 regularization weight.</param>
         /// <param name="numIterations">Number of training iterations through the data.</param>
         /// <param name="onFit">A delegate that is called every time the
         /// <see cref="Estimator{TTupleInShape, TTupleOutShape, TTransformer}.Fit(DataView{TTupleInShape})"/> method is called on the

From 2f42b80e7ecdf88314252895df3705dbacb09382 Mon Sep 17 00:00:00 2001
From: Senja Filipi <sefilipi@microsoft.com>
Date: Fri, 28 Sep 2018 10:55:05 -0700
Subject: [PATCH 08/10] cleaning up System.Single

---
 .../Standard/Online/OnlineGradientDescent.cs           | 10 ++++------
 1 file changed, 4 insertions(+), 6 deletions(-)

diff --git a/src/Microsoft.ML.StandardLearners/Standard/Online/OnlineGradientDescent.cs b/src/Microsoft.ML.StandardLearners/Standard/Online/OnlineGradientDescent.cs
index b9b4a6b11c..9c39e3cb7f 100644
--- a/src/Microsoft.ML.StandardLearners/Standard/Online/OnlineGradientDescent.cs
+++ b/src/Microsoft.ML.StandardLearners/Standard/Online/OnlineGradientDescent.cs
@@ -2,8 +2,6 @@
 // The .NET Foundation licenses this file to you under the MIT license.
 // See the LICENSE file in the project root for more information.
 
-using Float = System.Single;
-
 using Microsoft.ML.Core.Data;
 using Microsoft.ML.Runtime;
 using Microsoft.ML.Runtime.CommandLine;
@@ -117,8 +115,8 @@ protected override void CheckLabel(RoleMappedData data)
         protected override LinearRegressionPredictor CreatePredictor()
         {
             Contracts.Assert(WeightsScale == 1);
-            VBuffer<Float> weights = default(VBuffer<Float>);
-            Float bias;
+            VBuffer<float> weights = default(VBuffer<float>);
+            float bias;
 
             if (!Args.Averaged)
             {
@@ -128,8 +126,8 @@ protected override LinearRegressionPredictor CreatePredictor()
             else
             {
                 TotalWeights.CopyTo(ref weights);
-                VectorUtils.ScaleBy(ref weights, 1 / (Float)NumWeightUpdates);
-                bias = TotalBias / (Float)NumWeightUpdates;
+                VectorUtils.ScaleBy(ref weights, 1 / (float)NumWeightUpdates);
+                bias = TotalBias / (float)NumWeightUpdates;
             }
             return new LinearRegressionPredictor(Host, ref weights, bias);
         }

From e01ff3f98030839fe2132ce85c5039ec0cc023b7 Mon Sep 17 00:00:00 2001
From: Senja Filipi <sefilipi@microsoft.com>
Date: Fri, 28 Sep 2018 10:55:54 -0700
Subject: [PATCH 09/10] ctrl+k+d (format document; whitespace-only changes)

---
 .../Standard/Online/OnlineGradientDescent.cs                | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/src/Microsoft.ML.StandardLearners/Standard/Online/OnlineGradientDescent.cs b/src/Microsoft.ML.StandardLearners/Standard/Online/OnlineGradientDescent.cs
index 9c39e3cb7f..00dfb59cbd 100644
--- a/src/Microsoft.ML.StandardLearners/Standard/Online/OnlineGradientDescent.cs
+++ b/src/Microsoft.ML.StandardLearners/Standard/Online/OnlineGradientDescent.cs
@@ -50,8 +50,8 @@ public Arguments()
 
             internal class OgdDefaultArgs : AveragedDefaultArgs
             {
-               internal new const float LearningRate = 0.1f;
-               internal new const bool DecreaseLearningRate = true;
+                internal new const float LearningRate = 0.1f;
+                internal new const bool DecreaseLearningRate = true;
             }
         }
 
@@ -71,7 +71,7 @@ public OnlineGradientDescentTrainer(IHostEnvironment env,
             string labelColumn,
             string featureColumn,
             float learningRate = Arguments.OgdDefaultArgs.LearningRate,
-            bool decreaseLearningRate =Arguments.OgdDefaultArgs.DecreaseLearningRate,
+            bool decreaseLearningRate = Arguments.OgdDefaultArgs.DecreaseLearningRate,
             float l2RegularizerWeight = Arguments.OgdDefaultArgs.L2RegularizerWeight,
             int numIterations = Arguments.OgdDefaultArgs.NumIterations,
             string weightsColumn = null,

From 35a065fa53a93f870a29283f2f92ffc0e9bf9776 Mon Sep 17 00:00:00 2001
From: Senja Filipi <sefilipi@microsoft.com>
Date: Fri, 28 Sep 2018 11:34:14 -0700
Subject: [PATCH 10/10] Restoring the change on the solution. Off-by-one fix.

---
 Microsoft.ML.sln                                                | 2 +-
 .../Standard/Online/OnlineLearnerStatic.cs                      | 2 +-
 2 files changed, 2 insertions(+), 2 deletions(-)

diff --git a/Microsoft.ML.sln b/Microsoft.ML.sln
index c4a02ca217..1b12394544 100644
--- a/Microsoft.ML.sln
+++ b/Microsoft.ML.sln
@@ -119,7 +119,7 @@ Project("{9A19103F-16F7-4668-BE54-9A1E7A4F7556}") = "Microsoft.ML.OnnxTransform"
 EndProject
 Project("{9A19103F-16F7-4668-BE54-9A1E7A4F7556}") = "Microsoft.ML.DnnAnalyzer", "src\Microsoft.ML.DnnAnalyzer\Microsoft.ML.DnnAnalyzer\Microsoft.ML.DnnAnalyzer.csproj", "{73DAAC82-D308-48CC-8FFE-3B037F8BBCCA}"
 EndProject
-Project("{9A19103F-16F7-4668-BE54-9A1E7A4F7556}") = "Microsoft.ML.OnnxTransformTest", "test\Microsoft.ML.OnnxTransformTest\Microsoft.ML.OnnxTransformTest.csproj", "{49D03292-8AFE-4B82-823C-D047BF8420F7}"
+Project("{FAE04EC0-301F-11D3-BF4B-00C04F79EFBC}") = "Microsoft.ML.OnnxTransformTest", "test\Microsoft.ML.OnnxTransformTest\Microsoft.ML.OnnxTransformTest.csproj", "{49D03292-8AFE-4B82-823C-D047BF8420F7}"
 EndProject
 Project("{9A19103F-16F7-4668-BE54-9A1E7A4F7556}") = "Microsoft.ML.Benchmarks.Tests", "test\Microsoft.ML.Benchmarks.Tests\Microsoft.ML.Benchmarks.Tests.csproj", "{B6C83F04-A04B-4F00-9E68-1EC411F9317C}"
 EndProject
diff --git a/src/Microsoft.ML.StandardLearners/Standard/Online/OnlineLearnerStatic.cs b/src/Microsoft.ML.StandardLearners/Standard/Online/OnlineLearnerStatic.cs
index 1998dd0607..de286a59c8 100644
--- a/src/Microsoft.ML.StandardLearners/Standard/Online/OnlineLearnerStatic.cs
+++ b/src/Microsoft.ML.StandardLearners/Standard/Online/OnlineLearnerStatic.cs
@@ -167,7 +167,7 @@ internal static void CheckUserParams(PipelineColumn label,
             Contracts.CheckValueOrNull(weights);
             Contracts.CheckParam(learningRate > 0, nameof(learningRate), "Must be positive.");
             Contracts.CheckParam(0 <= l2RegularizerWeight && l2RegularizerWeight < 0.5, nameof(l2RegularizerWeight), "must be in range [0, 0.5)");
-            Contracts.CheckParam(numIterations > 1, nameof(numIterations), "Must be greater than one, if specified.");
+            Contracts.CheckParam(numIterations > 0, nameof(numIterations), "Must be positive, if specified.");
             Contracts.CheckValueOrNull(onFit);
         }
     }