SymSGD documentation (#3345)

Ivanidzo4ka · web-flow · commit 82dd1869e1a2 · 2019-04-16T17:04:53.000-07:00
diff --git a/docs/api-reference/io-columns-binary-classification.md b/docs/api-reference/io-columns-binary-classification.md
@@ -4,5 +4,5 @@ The input label column data must be <xref:System.Single>. This trainer outputs t
 | Output Column Name | Column Type | Description|
 | -- | -- | -- |
 | `Score` | <xref:System.Single> | The unbounded score that was calculated by the trainer to determine the prediction.|
-| `PredictedLabel` | <xref:System.Boolean> | The label predicted by the trainer. `false` maps to negative score and   `true` maps to positive score.|
-| `Probability` | <xref:System.Single> | The probability of the score in range [0, 1].|
+| `PredictedLabel` | <xref:System.Boolean> | The label predicted by the trainer. `false` maps to negative score and `true` maps to positive score.|
+| `Probability` | <xref:System.Single> | The probability of having `true` as the label. The probability value is in the range [0, 1].|
diff --git a/src/Microsoft.ML.Mkl.Components.StaticPipe/VectorWhiteningStaticExtensions.cs b/src/Microsoft.ML.Mkl.Components.StaticPipe/VectorWhiteningStaticExtensions.cs
@@ -56,7 +56,6 @@ public override IEstimator<ITransformer> Reconcile(IHostEnvironment env,
             }
         }
 
-        /// <include file='../Microsoft.ML.Mkl.Components/doc.xml' path='doc/members/member[@name="Whitening"]/*'/>
         /// <param name="input">The column to which the transform will be applied.</param>
         /// <param name="eps">Whitening constant, prevents division by zero when scaling the data by inverse of eigenvalues.</param>
         /// <param name="maxRows">Maximum number of rows used to train the transform.</param>
@@ -67,7 +66,6 @@ public static Vector<float> PcaWhitening(this Vector<float> input,
             int pcaNum = VectorWhiteningEstimator.Defaults.Rank)
             => new OutPipelineColumn(input, WhiteningKind.PrincipalComponentAnalysis, eps, maxRows, pcaNum);
 
-        /// <include file='../Microsoft.ML.Mkl.Components/doc.xml' path='doc/members/member[@name="Whitening"]/*'/>
         /// <param name="input">The column to which the transform will be applied.</param>
         /// <param name="eps">Whitening constant, prevents division by zero.</param>
         /// <param name="maxRows">Maximum number of rows used to train the transform.</param>
diff --git a/src/Microsoft.ML.Mkl.Components/MklComponentsCatalog.cs b/src/Microsoft.ML.Mkl.Components/MklComponentsCatalog.cs
@@ -69,13 +69,13 @@ public static OlsTrainer Ols(
         }
 
         /// <summary>
-        /// Predict a target using a linear binary classification model trained with the <see cref="SymbolicSgdLogisticRegressionBinaryTrainer"/>.
+        /// Create a <see cref="SymbolicSgdLogisticRegressionBinaryTrainer"/>, which predicts a target using a linear binary classification model trained over boolean label data.
         /// Stochastic gradient descent (SGD) is an iterative algorithm that optimizes a differentiable objective function.
         /// The <see cref="SymbolicSgdLogisticRegressionBinaryTrainer"/> parallelizes SGD using <a href="https://www.microsoft.com/en-us/research/project/project-parade/#!symbolic-execution">symbolic execution</a>.
         /// </summary>
         /// <param name="catalog">The <see cref="BinaryClassificationCatalog"/>.</param>
-        /// <param name="labelColumnName">The name of the label column.</param>
-        /// <param name="featureColumnName">The name of the feature column.</param>
+        /// <param name="labelColumnName">The name of the label column. The column data must be <see cref="System.Boolean"/>.</param>
+        /// <param name="featureColumnName">The name of the feature column. The column data must be a known-sized vector of <see cref="System.Single"/>.</param>
         /// <param name="numberOfIterations">Number of training iterations.</param>
         /// <example>
         /// <format type="text/markdown">
@@ -102,7 +102,7 @@ public static SymbolicSgdLogisticRegressionBinaryTrainer SymbolicSgdLogisticRegr
         }
 
         /// <summary>
-        ///  Predict a target using a linear binary classification model trained with the <see cref="SymbolicSgdLogisticRegressionBinaryTrainer"/>.
+        /// Create a <see cref="SymbolicSgdLogisticRegressionBinaryTrainer"/> with advanced options, which predicts a target using a linear binary classification model trained over boolean label data.
         /// Stochastic gradient descent (SGD) is an iterative algorithm that optimizes a differentiable objective function.
         /// The <see cref="SymbolicSgdLogisticRegressionBinaryTrainer"/> parallelizes SGD using <a href="https://www.microsoft.com/en-us/research/project/project-parade/#!symbolic-execution">symbolic execution</a>.
         /// </summary>
diff --git a/src/Microsoft.ML.Mkl.Components/SymSgdClassificationTrainer.cs b/src/Microsoft.ML.Mkl.Components/SymSgdClassificationTrainer.cs
@@ -31,14 +31,49 @@ namespace Microsoft.ML.Trainers
 {
     using TPredictor = CalibratedModelParametersBase<LinearBinaryModelParameters, PlattCalibrator>;
 
-    /// <include file='doc.xml' path='doc/members/member[@name="SymSGD"]/*' />
+    /// <summary>
+    /// The <see cref="IEstimator{TTransformer}"/> to predict a target using a linear binary classification model trained with symbolic stochastic gradient descent.
+    /// </summary>
+    /// <remarks>
+    /// <format type="text/markdown"><![CDATA[
+    /// To create this trainer, use [SymbolicSgdLogisticRegression](xref:Microsoft.ML.MklComponentsCatalog.SymbolicSgdLogisticRegression(Microsoft.ML.BinaryClassificationCatalog.BinaryClassificationTrainers,System.String,System.String,System.Int32))
+    /// or [SymbolicSgdLogisticRegression(Options)](xref:Microsoft.ML.MklComponentsCatalog.SymbolicSgdLogisticRegression(Microsoft.ML.BinaryClassificationCatalog.BinaryClassificationTrainers,Microsoft.ML.Trainers.SymbolicSgdLogisticRegressionBinaryTrainer.Options)).
+    ///
+    /// [!include[io](~/../docs/samples/docs/api-reference/io-columns-binary-classification.md)]
+    ///
+    /// ### Trainer Characteristics
+    /// |  |  |
+    /// | -- | -- |
+    /// | Machine learning task | Binary classification |
+    /// | Is normalization required? | Yes |
+    /// | Is caching required? | No |
+    /// | Required NuGet in addition to Microsoft.ML |Microsoft.ML.Mkl.Components |
+    /// ### Training Algorithm Details
+    /// The symbolic SGD is a classification algorithm that makes its predictions by finding a separating hyperplane.
+    /// For instance, with feature values $f_0, f_1,..., f_{D-1}$, the prediction is given by determining which side of the hyperplane the point falls on.
+    /// That is the same as the sign of the features' weighted sum, i.e. $\sum_{i = 0}^{D-1} (w_i * f_i)$, where $w_0, w_1,..., w_{D-1}$ are the weights computed by the algorithm.
+    ///
+    /// Most SGD algorithms are inherently sequential: at each step, the processing of the current example depends on the parameters learned from previous examples.
+    /// This algorithm instead trains local models in separate threads and uses a probabilistic model combiner that allows the local models to be combined
+    /// to produce the same result as what a sequential SGD would have produced, in expectation.
+    ///
+    /// For more information see [Parallel Stochastic Gradient Descent with Sound Combiners](https://arxiv.org/abs/1705.08030).
+    /// ]]>
+    /// </format>
+    /// </remarks>
+    /// <seealso cref="MklComponentsCatalog.SymbolicSgdLogisticRegression(BinaryClassificationCatalog.BinaryClassificationTrainers, string, string, int)" />
+    /// <seealso cref="MklComponentsCatalog.SymbolicSgdLogisticRegression(BinaryClassificationCatalog.BinaryClassificationTrainers, Options)"/>
+    /// <seealso cref="Options"/>
     public sealed class SymbolicSgdLogisticRegressionBinaryTrainer : TrainerEstimatorBase<BinaryPredictionTransformer<TPredictor>, TPredictor>
     {
         internal const string LoadNameValue = "SymbolicSGD";
         internal const string UserNameValue = "Symbolic SGD (binary)";
         internal const string ShortName = "SymSGD";
 
-        ///<summary> Advanced options for trainer.</summary>
+        /// <summary>
+        /// Options for the <see cref="SymbolicSgdLogisticRegressionBinaryTrainer"/> as used in
+        /// [SymbolicSgdLogisticRegression(Options)](xref:Microsoft.ML.MklComponentsCatalog.SymbolicSgdLogisticRegression(Microsoft.ML.BinaryClassificationCatalog.BinaryClassificationTrainers,Microsoft.ML.Trainers.SymbolicSgdLogisticRegressionBinaryTrainer.Options)).
+        /// </summary>
         public sealed class Options : TrainerInputBaseWithLabel
         {
             /// <summary>
diff --git a/src/Microsoft.ML.Mkl.Components/VectorWhitening.cs b/src/Microsoft.ML.Mkl.Components/VectorWhitening.cs
@@ -46,7 +46,6 @@ public enum WhiteningKind
         ZeroPhaseComponentAnalysis
     }
 
-    /// <include file='doc.xml' path='doc/members/member[@name="Whitening"]/*'/>
     public sealed class VectorWhiteningTransformer : OneToOneTransformerBase
     {
         internal sealed class Options
@@ -666,7 +665,6 @@ private static float DotProduct(float[] a, int aOffset, ReadOnlySpan<float> b, R
         }
     }
 
-    /// <include file='doc.xml' path='doc/members/member[@name="Whitening"]/*'/>
     public sealed class VectorWhiteningEstimator : IEstimator<VectorWhiteningTransformer>
     {
         [BestFriend]
@@ -801,7 +799,6 @@ internal void Save(ModelSaveContext ctx)
         private readonly IHost _host;
         private readonly ColumnOptions[] _infos;
 
-        /// <include file='doc.xml' path='doc/members/member[@name="Whitening"]/*'/>
         /// <param name="env">The environment.</param>
         /// <param name="columns">Describes the parameters of the whitening process for each column pair.</param>
         internal VectorWhiteningEstimator(IHostEnvironment env, params ColumnOptions[] columns)
@@ -810,7 +807,6 @@ internal VectorWhiteningEstimator(IHostEnvironment env, params ColumnOptions[] c
             _infos = columns;
         }
 
-        /// <include file='doc.xml' path='doc/members/member[@name="Whitening"]/*'/>
         /// <param name="env">The environment.</param>
         /// <param name="outputColumnName">Name of the column resulting from the transformation of <paramref name="inputColumnName"/>.</param>
         /// <param name="inputColumnName">Name of column to transform. If set to <see langword="null"/>, the value of the <paramref name="outputColumnName"/> will be used as source.</param>
diff --git a/src/Microsoft.ML.Mkl.Components/doc.xml b/src/Microsoft.ML.Mkl.Components/doc.xml

Original file line number	Diff line number	Diff line change
`@@ -56,7 +56,6 @@ public override IEstimator<ITransformer> Reconcile(IHostEnvironment env,`
`56`	`56`	`}`
`57`	`57`	`}`
`58`	`58`
`59`		`- /// <include file='../Microsoft.ML.Mkl.Components/doc.xml' path='doc/members/member[@name="Whitening"]/*'/>`
`60`	`59`	`/// <param name="input">The column to which the transform will be applied.</param>`
`61`	`60`	`/// <param name="eps">Whitening constant, prevents division by zero when scaling the data by inverse of eigenvalues.</param>`
`62`	`61`	`/// <param name="maxRows">Maximum number of rows used to train the transform.</param>`
`@@ -67,7 +66,6 @@ public static Vector<float> PcaWhitening(this Vector<float> input,`
`67`	`66`	`int pcaNum = VectorWhiteningEstimator.Defaults.Rank)`
`68`	`67`	`=> new OutPipelineColumn(input, WhiteningKind.PrincipalComponentAnalysis, eps, maxRows, pcaNum);`
`69`	`68`
`70`		`- /// <include file='../Microsoft.ML.Mkl.Components/doc.xml' path='doc/members/member[@name="Whitening"]/*'/>`
`71`	`69`	`/// <param name="input">The column to which the transform will be applied.</param>`
`72`	`70`	`/// <param name="eps">Whitening constant, prevents division by zero.</param>`
`73`	`71`	`/// <param name="maxRows">Maximum number of rows used to train the transform.</param>`
Original file line number	Diff line number	Diff line change
`@@ -46,7 +46,6 @@ public enum WhiteningKind`
`46`	`46`	`ZeroPhaseComponentAnalysis`
`47`	`47`	`}`
`48`	`48`
`49`		`- /// <include file='doc.xml' path='doc/members/member[@name="Whitening"]/*'/>`
`50`	`49`	`public sealed class VectorWhiteningTransformer : OneToOneTransformerBase`
`51`	`50`	`{`
`52`	`51`	`internal sealed class Options`
`@@ -666,7 +665,6 @@ private static float DotProduct(float[] a, int aOffset, ReadOnlySpan<float> b, R`
`666`	`665`	`}`
`667`	`666`	`}`
`668`	`667`
`669`		`- /// <include file='doc.xml' path='doc/members/member[@name="Whitening"]/*'/>`
`670`	`668`	`public sealed class VectorWhiteningEstimator : IEstimator<VectorWhiteningTransformer>`
`671`	`669`	`{`
`672`	`670`	`[BestFriend]`
`@@ -801,7 +799,6 @@ internal void Save(ModelSaveContext ctx)`
`801`	`799`	`private readonly IHost _host;`
`802`	`800`	`private readonly ColumnOptions[] _infos;`
`803`	`801`
`804`		`- /// <include file='doc.xml' path='doc/members/member[@name="Whitening"]/*'/>`
`805`	`802`	`/// <param name="env">The environment.</param>`
`806`	`803`	`/// <param name="columns">Describes the parameters of the whitening process for each column pair.</param>`
`807`	`804`	`internal VectorWhiteningEstimator(IHostEnvironment env, params ColumnOptions[] columns)`
`@@ -810,7 +807,6 @@ internal VectorWhiteningEstimator(IHostEnvironment env, params ColumnOptions[] c`
`810`	`807`	`_infos = columns;`
`811`	`808`	`}`
`812`	`809`
`813`		`- /// <include file='doc.xml' path='doc/members/member[@name="Whitening"]/*'/>`
`814`	`810`	`/// <param name="env">The environment.</param>`
`815`	`811`	`/// <param name="outputColumnName">Name of the column resulting from the transformation of <paramref name="inputColumnName"/>.</param>`
`816`	`812`	`/// <param name="inputColumnName">Name of column to transform. If set to <see langword="null"/>, the value of the <paramref name="outputColumnName"/> will be used as source.</param>`