ReconfigurablePrediction

Ivan Matantsev · Ivan Matantsev · commit f85cd9cc9acd · 2018-08-06T14:41:55.000-07:00
and shorter execution
diff --git a/test/Microsoft.ML.Tests/Scenarios/Api/CrossValidation.cs b/test/Microsoft.ML.Tests/Scenarios/Api/CrossValidation.cs
@@ -34,7 +34,8 @@ void CrossValidation()
                 // Train.
                 var trainer = new LinearClassificationTrainer(env, new LinearClassificationTrainer.Arguments
                 {
-                    NumThreads = 1
+                    NumThreads = 1,
+                    ConvergenceTolerance = 1f
                 });
 
                 // Auto-caching.
diff --git a/test/Microsoft.ML.Tests/Scenarios/Api/Evaluation.cs b/test/Microsoft.ML.Tests/Scenarios/Api/Evaluation.cs
@@ -1,9 +1,5 @@
 ﻿using Microsoft.ML.Runtime.Data;
 using Microsoft.ML.Runtime.Learners;
-using Microsoft.ML.Runtime.Api;
-using System;
-using System.Collections.Generic;
-using System.Text;
 using Xunit;
 using Microsoft.ML.Models;
 
diff --git a/test/Microsoft.ML.Tests/Scenarios/Api/ReconfigurablePrediction.cs b/test/Microsoft.ML.Tests/Scenarios/Api/ReconfigurablePrediction.cs
@@ -0,0 +1,60 @@
+﻿using Microsoft.ML.Models;
+using Microsoft.ML.Runtime.Data;
+using Microsoft.ML.Runtime.Learners;
+using Xunit;
+
+namespace Microsoft.ML.Tests.Scenarios.Api
+{
+    public partial class ApiScenariosTests
+    {
+        /// <summary>
+        /// Reconfigurable predictions: The following should be possible: A user trains a binary classifier,
+        /// and through the test evaluator gets a PR curve, then based on the PR curve picks a new threshold
+        /// and configures the scorer (or more precisely instantiates a new scorer over the same predictor)
+        /// with some threshold derived from that.
+        /// </summary>
+        [Fact]
+        void ReconfigurablePrediction()
+        {
+            var dataPath = GetDataPath(SentimentDataPath);
+            var testDataPath = GetDataPath(SentimentTestPath); // NOTE(review): not referenced again in this method.
+
+            using (var env = new TlcEnvironment(seed: 1, conc: 1))
+            {
+                // Pipeline: read the file at dataPath with a TextLoader, then apply TextTransform on top of it.
+                var loader = new TextLoader(env, MakeSentimentTextLoaderArgs(), new MultiFileSource(dataPath));
+
+                var trans = TextTransform.Create(env, MakeSentimentTextTransformArgs(), loader);
+
+                // Train a LinearClassificationTrainer (NumThreads = 1) on a cached view of the transformed data.
+                var trainer = new LinearClassificationTrainer(env, new LinearClassificationTrainer.Arguments
+                {
+                    NumThreads = 1
+                });
+
+                var cached = new CacheDataView(env, trans, prefetch: null);
+                var trainRoles = new RoleMappedData(cached, label: "Label", feature: "Features");
+                var predictor = trainer.Train(new Runtime.TrainContext(trainRoles));
+                var scoreRoles = new RoleMappedData(trans, label: "Label", feature: "Features");
+                IDataScorerTransform scorer = ScoreUtils.GetScorer(predictor, scoreRoles, env, trainRoles.Schema);
+                // First pass: evaluate the output of the scorer obtained from ScoreUtils.GetScorer.
+                var dataEval = new RoleMappedData(scorer, label: "Label", feature: "Features", opt: true);
+
+                var evaluator = new BinaryClassifierMamlEvaluator(env, new BinaryClassifierMamlEvaluator.Arguments() { });
+                var metricsDict = evaluator.Evaluate(dataEval);
+
+                var metrics = BinaryClassificationMetrics.FromMetrics(env, metricsDict["OverallMetrics"], metricsDict["ConfusionMatrix"])[0];
+                // Second pass: bind the same predictor again and build a new scorer with Threshold = 0.01f on the Probability column.
+                var bindable = ScoreUtils.GetSchemaBindableMapper(env, predictor, null);
+                var mapper = bindable.Bind(env, trainRoles.Schema);
+                var newScorer = new BinaryClassifierScorer(env, new BinaryClassifierScorer.Arguments { Threshold = 0.01f, ThresholdColumn = DefaultColumnNames.Probability },
+                    scoreRoles.Data, mapper, trainRoles.Schema);
+                // Re-evaluate over the new scorer, with the evaluator configured for the same 0.01f threshold (UseRawScoreThreshold = false).
+                dataEval = new RoleMappedData(newScorer, label: "Label", feature: "Features", opt: true);
+                var new_evaluator = new BinaryClassifierMamlEvaluator(env, new BinaryClassifierMamlEvaluator.Arguments() { Threshold = 0.01f, UseRawScoreThreshold = false });
+                metricsDict = new_evaluator.Evaluate(dataEval);
+                var new_metrics = BinaryClassificationMetrics.FromMetrics(env, metricsDict["OverallMetrics"], metricsDict["ConfusionMatrix"])[0]; // NOTE(review): metrics and new_metrics are computed but never asserted on.
+            }
+        }
+    }
+}

Original file line number	Diff line number	Diff line change
`@@ -34,7 +34,8 @@ void CrossValidation()`
`34`	`34`	`// Train.`
`35`	`35`	`var trainer = new LinearClassificationTrainer(env, new LinearClassificationTrainer.Arguments`
`36`	`36`	`{`
`37`		`- NumThreads = 1`
	`37`	`+ NumThreads = 1,`
	`38`	`+ ConvergenceTolerance = 1f`
`38`	`39`	`});`
`39`	`40`
`40`	`41`	`// Auto-caching.`