
Added Microsoft.ML.Benchmarks Project #62


Merged (10 commits) on May 15, 2018
Changes from 1 commit
Added Accuracy Reporting
KrzysztofCwalina committed May 8, 2018
commit 1647ef59d4b33c582786eecda570bfea65fa7ca8
5 changes: 5 additions & 0 deletions test/Microsoft.ML.Benchmarks/Microsoft.ML.Benchmarks.csproj
@@ -5,6 +5,11 @@
<TargetFramework>netcoreapp2.0</TargetFramework>
<StartupObject>Microsoft.ML.Benchmarks.Program</StartupObject>
Member:
What is this used for? I've never seen this in new SDK-style projects.

Member Author:
When I remove it, it tells me there is more than one entry point and so the one real one must be specified. Possibly one of the BDN dlls has a Main method? @adamsitnik?
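For context, StartupObject is the MSBuild property that tells the C# compiler which type's Main method to use when more than one entry point is visible in the compilation. A minimal sketch of the property as it appears in this project's csproj (the explanatory comment is ours, not part of the PR):

```xml
<PropertyGroup>
  <!-- If the compilation sees more than one static Main, the build fails
       with CS0017 unless the entry-point type is named explicitly: -->
  <StartupObject>Microsoft.ML.Benchmarks.Program</StartupObject>
</PropertyGroup>
```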

</PropertyGroup>
<ItemGroup>
<Compile Remove="BenchmarkDotNet.Artifacts\**" />
<EmbeddedResource Remove="BenchmarkDotNet.Artifacts\**" />
<None Remove="BenchmarkDotNet.Artifacts\**" />
</ItemGroup>
<ItemGroup>
<PackageReference Include="BenchmarkDotNet" Version="0.10.14" />
</ItemGroup>
42 changes: 42 additions & 0 deletions test/Microsoft.ML.Benchmarks/Program.cs
@@ -6,9 +6,17 @@
using BenchmarkDotNet.Diagnosers;
using BenchmarkDotNet.Jobs;
using BenchmarkDotNet.Running;
using BenchmarkDotNet.Columns;
using BenchmarkDotNet.Reports;
using BenchmarkDotNet.Toolchains.CsProj;
using BenchmarkDotNet.Toolchains.InProcess;
using System;
using System.IO;
using Microsoft.ML.Models;
using Microsoft.ML.Runtime.Api;
using Microsoft.ML.Trainers;
using Microsoft.ML.Transforms;
using Microsoft.ML.Benchmarks;

namespace Microsoft.ML.Benchmarks
{
@@ -30,6 +38,7 @@ private static IConfig CreateClrVsCoreConfig()
var config = DefaultConfig.Instance.With(
Job.ShortRun.
With(InProcessToolchain.Instance)).
With(new ClassificationMetricsColumn("AccuracyMacro", "Macro-average accuracy of the model")).
With(MemoryDiagnoser.Default);
return config;
}
@@ -45,4 +54,37 @@ static Program()
_dataRoot = Path.Combine(rootDir, "test", "data");
}
}


public class ClassificationMetricsColumn : IColumn
{
string _metricName;
string _legend;

public ClassificationMetricsColumn(string metricName, string legend)
{
_metricName = metricName;
_legend = legend;
}

public string ColumnName => _metricName;
public string Id => _metricName;
public string Legend => _legend;
public bool IsNumeric => true;
public bool IsDefault(Summary summary, Benchmark benchmark) => true;
public bool IsAvailable(Summary summary) => true;
public bool AlwaysShow => true;
public ColumnCategory Category => ColumnCategory.Custom;
public int PriorityInCategory => 1;
public UnitType UnitType => UnitType.Dimensionless;

public string GetValue(Summary summary, Benchmark benchmark, ISummaryStyle style)
{
var property = typeof(ClassificationMetrics).GetProperty(_metricName);
return property.GetValue(TrainPredictionBench.s_metrics).ToString();
}
public string GetValue(Summary summary, Benchmark benchmark) => GetValue(summary, benchmark, null);

public override string ToString() => ColumnName;
}
}
18 changes: 16 additions & 2 deletions test/Microsoft.ML.Benchmarks/TrainPredictionBench.cs
@@ -3,16 +3,28 @@
// See the LICENSE file in the project root for more information.

using BenchmarkDotNet.Attributes;
using BenchmarkDotNet.Running;
using Microsoft.ML.Models;
using Microsoft.ML.Runtime.Api;
using Microsoft.ML.Trainers;
using Microsoft.ML.Transforms;


namespace Microsoft.ML.Benchmarks
{
[KeepBenchmarkFiles]
public class TrainPredictionBench
Contributor (@glebuk), May 9, 2018:
> TrainPredictionBench

Split benchmarks by task (regression, binary, etc). You already have classification metrics as a field. Perhaps have a base class and then subclasses for each task. #Closed
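For illustration, the shape glebuk is describing might look like the following. This is a rough sketch only: the class and method names are hypothetical, and RegressionMetrics is assumed to be the regression counterpart of the ClassificationMetrics type used in this PR.

```csharp
using BenchmarkDotNet.Attributes;
using Microsoft.ML.Models;

// Hypothetical split: a shared base class drives the benchmark,
// and each ML task supplies its own pipeline and metrics.
public abstract class TrainBenchBase
{
    [Benchmark]
    public void Train() => TrainCore();

    protected abstract void TrainCore();
}

public class ClassificationBench : TrainBenchBase
{
    internal static ClassificationMetrics s_metrics;  // task-specific metrics

    protected override void TrainCore()
    {
        // build, train, and evaluate a classification pipeline here
    }
}

public class RegressionBench : TrainBenchBase
{
    internal static RegressionMetrics s_metrics;

    protected override void TrainCore()
    {
        // build, train, and evaluate a regression pipeline here
    }
}
```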

Member Author (@KrzysztofCwalina), May 9, 2018:
changed the test to StochasticDualCoordinateAscentClassifierBench #Closed

Contributor:
Should the file name be updated too?



Contributor:
Can you please update the file name to match the class name?



{
internal static ClassificationMetrics s_metrics;
Contributor (@glebuk), May 9, 2018:
> internal static ClassificationMetrics s_metrics;

It would also be awesome to figure out how to minimize the amount of code per dataset, so that you can just add a dataset and not have to change much else. It should also be quick and easy to substitute different learners. Basically, the dimensions for tests are:

Training:
- Task
- Learner
- Hyper-parameters {default, sweep}
- Dataset
- Subset by size (like 10%, 50%, 100% of rows)

Inference:
- Pipeline load time
- Time per prediction #Pending

Member Author (@KrzysztofCwalina), May 9, 2018:
Yeah, this is a good idea, but I think such generalizations are best done when actually trying to develop the second, third, etc. test. i.e. I will try to do it when I am adding more tests. #Closed
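As a rough illustration of how glebuk's training dimensions could map onto BenchmarkDotNet's parameterization: each [Params] value multiplies the benchmark cases, so dataset and learner become axes rather than copied code. A sketch under assumptions: CreateTrainer is a hypothetical factory, and IrisData/IrisPrediction are the types defined later in this file.

```csharp
using BenchmarkDotNet.Attributes;
using Microsoft.ML;
using Microsoft.ML.Trainers;
using Microsoft.ML.Transforms;

public class ParameterizedTrainBench
{
    // BenchmarkDotNet runs every Dataset x Learner combination as its own case.
    [Params("iris.txt")]   // add more dataset files here
    public string Dataset;

    [Params("SDCA")]       // add more learner names here
    public string Learner;

    [Benchmark]
    public void Train()
    {
        var pipeline = new LearningPipeline();
        pipeline.Add(new TextLoader<IrisData>(
            Program.GetDataPath(Dataset), useHeader: true, separator: "tab"));
        pipeline.Add(new ColumnConcatenator(
            "Features", "SepalLength", "SepalWidth", "PetalLength", "PetalWidth"));
        pipeline.Add(CreateTrainer(Learner));
        pipeline.Train<IrisData, IrisPrediction>();
    }

    // Hypothetical factory mapping a parameter value to a trainer instance.
    private static ILearningPipelineItem CreateTrainer(string name)
    {
        switch (name)
        {
            case "SDCA": return new StochasticDualCoordinateAscentClassifier();
            default: throw new System.ArgumentException("Unknown learner: " + name);
        }
    }
}
```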

static PredictionModel<IrisData, IrisPrediction> s_trainedModel;

[GlobalCleanup]
public void Accuracy()
{
var dataPath = Program.GetDataPath("iris.txt");
var testData = new TextLoader<IrisData>(dataPath, useHeader: true, separator: "tab");
var evaluator = new ClassificationEvaluator();
s_metrics = evaluator.Evaluate(s_trainedModel, testData);
}

[Benchmark]
public void Iris()
Member:
Is it possible for us to mark a bunch of integration tests as benchmarks in this way?

Member Author (@KrzysztofCwalina), May 8, 2018:
They would need to be a part of an exe project (like this one). But maybe we can try to expose the integration tests in public APIs (of the test project) and then just run them from a benchmark stub in this project. @adamsitnik? #Pending

Contributor (@glebuk), May 10, 2018:
Now there are at least two possible ways to do this: create those items as unit tests (comment above), or use a general-purpose command-line tool to execute specific pipelines.
For the second scenario, the command-line tool: it seems such a tool would be great to have in contexts outside of benchmarking. Does it really make sense to create a benchmarking-only tool? Why not simply port MaML.EXE and create a bunch of *.RSP files to define each benchmark? That would save us a lot of time developing this AND would give users a CLI for ML.NET.
Opened issue #108 to track this.


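For the unit-test route, the benchmark side could stay tiny: a stub that calls a scenario the test project exposes publicly. A sketch; IrisScenarios and TrainAndPredictIrisModel are hypothetical stand-ins for whatever public API the test project would expose.

```csharp
using BenchmarkDotNet.Attributes;

public class IntegrationTestBench
{
    // Hypothetical: the test project exposes its scenario as a public method,
    // and this project only wraps it in a BenchmarkDotNet stub.
    private readonly IrisScenarios _scenarios = new IrisScenarios();

    [Benchmark]
    public void TrainAndPredictIris() => _scenarios.TrainAndPredictIrisModel();
}
```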

{
@@ -50,6 +62,8 @@ public void Iris()
PetalLength = 1.2f,
PetalWidth = 4.4f,
});

s_trainedModel = model;
}

public class IrisData