Skip to content

Commit 5707e17

Browse files
author
Ivan Matantsev
committed
add key transform to benchmark
1 parent 9dff7be commit 5707e17

File tree

2 files changed

+11
-6
lines changed

2 files changed

+11
-6
lines changed

test/Microsoft.ML.Benchmarks/PredictionEngineBench.cs

+3 -2
Original file line number | Diff line number | Diff line change
@@ -58,8 +58,9 @@ public void SetupIrisPipeline()
5858
IDataView data = loader.Load(_irisDataPath);
5959

6060
var pipeline = new ColumnConcatenatingEstimator(env, "Features", new[] { "SepalLength", "SepalWidth", "PetalLength", "PetalWidth" })
61+
.Append(env.Transforms.Conversion.MapValueToKey("Label"))
6162
.Append(env.MulticlassClassification.Trainers.StochasticDualCoordinateAscent(
62-
new SdcaMultiClassTrainer.Options {NumThreads = 1, ConvergenceTolerance = 1e-2f, }));
63+
new SdcaMultiClassTrainer.Options { NumThreads = 1, ConvergenceTolerance = 1e-2f, }));
6364

6465
var model = pipeline.Fit(data);
6566

@@ -94,7 +95,7 @@ public void SetupSentimentPipeline()
9495

9596
var pipeline = mlContext.Transforms.Text.FeaturizeText("Features", "SentimentText")
9697
.Append(mlContext.BinaryClassification.Trainers.StochasticDualCoordinateAscentNonCalibrated(
97-
new SdcaNonCalibratedBinaryTrainer.Options {NumThreads = 1, ConvergenceTolerance = 1e-2f, }));
98+
new SdcaNonCalibratedBinaryTrainer.Options { NumThreads = 1, ConvergenceTolerance = 1e-2f, }));
9899

99100
var model = pipeline.Fit(data);
100101

test/Microsoft.ML.Benchmarks/StochasticDualCoordinateAscentClassifierBench.cs

+8 -4
Original file line number | Diff line number | Diff line change
@@ -71,6 +71,7 @@ private TransformerChain<MulticlassPredictionTransformer<MulticlassLogisticRegre
7171
IDataView data = loader.Load(dataPath);
7272

7373
var pipeline = new ColumnConcatenatingEstimator(mlContext, "Features", new[] { "SepalLength", "SepalWidth", "PetalLength", "PetalWidth" })
74+
.Append(mlContext.Transforms.Conversion.MapValueToKey("Label"))
7475
.Append(mlContext.MulticlassClassification.Trainers.StochasticDualCoordinateAscent());
7576

7677
return pipeline.Fit(data);
@@ -93,8 +94,9 @@ public void TrainSentiment()
9394
};
9495

9596
var loader = mlContext.Data.LoadFromTextFile(_sentimentDataPath, arguments);
96-
var text = mlContext.Transforms.Text.FeaturizeText("WordEmbeddings", new List<string> { "SentimentText" },
97-
new TextFeaturizingEstimator.Options {
97+
var text = mlContext.Transforms.Text.FeaturizeText("WordEmbeddings", new List<string> { "SentimentText" },
98+
new TextFeaturizingEstimator.Options
99+
{
98100
OutputTokens = true,
99101
KeepPunctuations = false,
100102
UseStopRemover = true,
@@ -103,8 +105,10 @@ public void TrainSentiment()
103105
UseWordExtractor = false,
104106
}).Fit(loader).Transform(loader);
105107

106-
var trans = mlContext.Transforms.Text.ExtractWordEmbeddings("Features", "WordEmbeddings_TransformedText",
107-
WordEmbeddingsExtractingEstimator.PretrainedModelKind.Sswe).Fit(text).Transform(text);
108+
var trans = mlContext.Transforms.Text.ExtractWordEmbeddings("Features", "WordEmbeddings_TransformedText",
109+
WordEmbeddingsExtractingEstimator.PretrainedModelKind.Sswe)
110+
.Append(mlContext.Transforms.Conversion.MapValueToKey("Label"))
111+
.Fit(text).Transform(text);
108112

109113
// Train
110114
var trainer = mlContext.MulticlassClassification.Trainers.StochasticDualCoordinateAscent();

0 commit comments

Comments
 (0)