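Addressed reviewers' comments: renamed LabeLColumn to LabelColumn (no default value), added a separate TensorFlowLabel argument for the label node in the TensorFlow graph, disposed TFStatus in CreateString, and extracted GetInputMetaData from TrainCore.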

zeahmed · zeahmed · commit 9c07a53e1cfd · 2018-10-04T16:18:37.000-07:00
diff --git a/src/Microsoft.ML.Legacy/CSharpApi.cs b/src/Microsoft.ML.Legacy/CSharpApi.cs
@@ -15804,7 +15804,12 @@ public sealed partial class TensorFlowScorer : Microsoft.ML.Runtime.EntryPoints.
             /// <summary>
             /// Training labels.
             /// </summary>
-            public string LabeLColumn { get; set; } = "Label";
+            public string LabelColumn { get; set; }
+
+            /// <summary>
+            /// TensorFlow label node.
+            /// </summary>
+            public string TensorFlowLabel { get; set; }
 
             /// <summary>
             /// The name of the optimization operation in the TensorFlow graph.
diff --git a/src/Microsoft.ML.TensorFlow/TensorFlow/Tensor.cs b/src/Microsoft.ML.TensorFlow/TensorFlow/Tensor.cs
@@ -436,13 +436,15 @@ internal static unsafe TFTensor CreateString(byte[] buffer)
             // Clear offset table
             IntPtr dst = TF_TensorData(handle);
             Marshal.WriteInt64(dst, 0);
-            var status = new TFStatus();
-            fixed (byte* src = &buffer[0])
+            using (var status = new TFStatus())
             {
-                TF_StringEncode(src, (UIntPtr)buffer.Length, (sbyte*)(dst + 8), size, status.handle);
-                var ok = status.StatusCode == TFCode.Ok;
-                if (!ok)
-                    return null;
+                fixed (byte* src = &buffer[0])
+                {
+                    TF_StringEncode(src, (UIntPtr)buffer.Length, (sbyte*)(dst + 8), size, status.handle);
+                    var ok = status.StatusCode == TFCode.Ok;
+                    if (!ok)
+                        return null;
+                }
             }
             return new TFTensor(handle);
         }
diff --git a/src/Microsoft.ML.TensorFlow/TensorFlow/Tensorflow.cs b/src/Microsoft.ML.TensorFlow/TensorFlow/Tensorflow.cs
@@ -290,7 +290,7 @@ public TFStatus() : base(TF_NewStatus())
 
         // extern void TF_DeleteStatus (TF_Status *);
         [DllImport(NativeBinding.TensorFlowLibrary)]
-        internal static extern unsafe void TF_DeleteStatus(TF_Status status);
+        private static extern unsafe void TF_DeleteStatus(TF_Status status);
 
         internal override void NativeDispose(IntPtr handle)
         {
@@ -313,7 +313,7 @@ public void SetStatusCode(TFCode code, string msg)
 
         // extern TF_Code TF_GetCode (const TF_Status *s);
         [DllImport(NativeBinding.TensorFlowLibrary)]
-        internal static extern unsafe TFCode TF_GetCode(TF_Status s);
+        private static extern unsafe TFCode TF_GetCode(TF_Status s);
 
         /// <summary>
         /// Gets the status code for the status code.
diff --git a/src/Microsoft.ML.TensorFlow/TensorflowTransform.cs b/src/Microsoft.ML.TensorFlow/TensorflowTransform.cs
@@ -60,59 +60,65 @@ public sealed class Arguments : TransformInputBase
             public string[] OutputColumns;
 
             /// <summary>
-            /// The name of the column used as label for training.
+            /// The name of the label column in the <see cref="IDataView"/> that will be mapped to the label node in the TensorFlow model.
             /// </summary>
             [Argument(ArgumentType.AtMostOnce, HelpText = "Training labels.", ShortName = "label", SortOrder = 4)]
-            public string LabeLColumn = DefaultColumnNames.Label;
+            public string LabelColumn;
+
+            /// <summary>
+            /// The name of the label node in the TensorFlow model.
+            /// </summary>
+            [Argument(ArgumentType.AtMostOnce, HelpText = "TensorFlow label node.", ShortName = "TFLabel", SortOrder = 5)]
+            public string TensorFlowLabel;
 
             /// <summary>
             /// Name of the operation in TensorFlow graph that is used for optimizing parameters in the graph.
             /// Usually it is the name specified in the minimize method of optimizer in python
             /// e.g. optimizer = tf.train.GradientDescentOptimizer(learning_rate).minimize(cost, name = "SGDOptimizer").
             /// </summary>
-            [Argument(ArgumentType.AtMostOnce, HelpText = "The name of the optimization operation in the TensorFlow graph.", ShortName = "OptimizationOp", SortOrder = 4)]
+            [Argument(ArgumentType.AtMostOnce, HelpText = "The name of the optimization operation in the TensorFlow graph.", ShortName = "OptimizationOp", SortOrder = 6)]
             public string OptimizationOperation;
 
             /// <summary>
             /// The name of the operation in the TensorFlow graph to compute training loss (Optional).
             /// </summary>
-            [Argument(ArgumentType.AtMostOnce, HelpText = "The name of the operation in the TensorFlow graph to compute training loss (Optional)", ShortName = "LossOp", SortOrder = 5)]
+            [Argument(ArgumentType.AtMostOnce, HelpText = "The name of the operation in the TensorFlow graph to compute training loss (Optional)", ShortName = "LossOp", SortOrder = 7)]
             public string LossOperation;
 
             /// <summary>
             /// The name of the operation in the TensorFlow graph to compute performance metric during training (Optional).
             /// </summary>
-            [Argument(ArgumentType.AtMostOnce, HelpText = "The name of the operation in the TensorFlow graph to compute performance metric during training (Optional)", ShortName = "MetricOp", SortOrder = 6)]
+            [Argument(ArgumentType.AtMostOnce, HelpText = "The name of the operation in the TensorFlow graph to compute performance metric during training (Optional)", ShortName = "MetricOp", SortOrder = 8)]
             public string MetricOperation;
 
             /// <summary>
             /// Number of samples to use for mini-batch training.
             /// </summary>
-            [Argument(ArgumentType.AtMostOnce, HelpText = "Number of samples to use for mini-batch training.", SortOrder = 7)]
+            [Argument(ArgumentType.AtMostOnce, HelpText = "Number of samples to use for mini-batch training.", SortOrder = 9)]
             public int BatchSize = 64;
 
             /// <summary>
             /// Number of training iterations.
             /// </summary>
-            [Argument(ArgumentType.AtMostOnce, HelpText = "Number of training iterations.", SortOrder = 8)]
+            [Argument(ArgumentType.AtMostOnce, HelpText = "Number of training iterations.", SortOrder = 10)]
             public int Epoch = 5;
 
             /// <summary>
             /// The name of the operation in the TensorFlow graph which sets optimizer learning rate (Optional).
             /// </summary>
-            [Argument(ArgumentType.AtMostOnce, HelpText = "The name of the operation in the TensorFlow graph which sets optimizer learning rate (Optional).", SortOrder = 9)]
+            [Argument(ArgumentType.AtMostOnce, HelpText = "The name of the operation in the TensorFlow graph which sets optimizer learning rate (Optional).", SortOrder = 11)]
             public string LearningRateOperation;
 
             /// <summary>
             /// Learning rate to use during optimization.
             /// </summary>
-            [Argument(ArgumentType.AtMostOnce, HelpText = "Learning rate to use during optimization.", SortOrder = 10)]
+            [Argument(ArgumentType.AtMostOnce, HelpText = "Learning rate to use during optimization.", SortOrder = 12)]
             public float LearningRate = 0.01f;
 
             /// <summary>
             /// Shuffle training data on each iteration?
             /// </summary>
-            [Argument(ArgumentType.AtMostOnce, HelpText = "Shuffle data before each iteration.", SortOrder = 11)]
+            [Argument(ArgumentType.AtMostOnce, HelpText = "Shuffle data before each iteration.", SortOrder = 13)]
             public bool Shuffle = true;
 
             /// <summary>
@@ -121,7 +127,7 @@ public sealed class Arguments : TransformInputBase
             /// Therefore, its highly unlikely that this parameter is changed from its default value of 'save/Const'.
             /// Please change it cautiously if you need to.
             /// </summary>
-            [Argument(ArgumentType.AtMostOnce, HelpText = "Name of the input in TensorFlow graph that specifiy the location for saving/restoring models from disk.", SortOrder = 12)]
+            [Argument(ArgumentType.AtMostOnce, HelpText = "Name of the input in TensorFlow graph that specifiy the location for saving/restoring models from disk.", SortOrder = 14)]
             public string SaveLocationOperation = "save/Const";
 
             /// <summary>
@@ -130,13 +136,13 @@ public sealed class Arguments : TransformInputBase
             /// Therefore, its highly unlikely that this parameter is changed from its default value of 'save/control_dependency'.
             /// Please change it cautiously if you need to.
             /// </summary>
-            [Argument(ArgumentType.AtMostOnce, HelpText = "Name of the input in TensorFlow graph that specifiy the location for saving/restoring models from disk.", SortOrder = 13)]
+            [Argument(ArgumentType.AtMostOnce, HelpText = "Name of the input in TensorFlow graph that specifiy the location for saving/restoring models from disk.", SortOrder = 15)]
             public string SaveOperation = "save/control_dependency";
 
             /// <summary>
             /// Needed for command line to specify if retraining is requested.
             /// </summary>
-            [Argument(ArgumentType.AtMostOnce, HelpText = "Retrain TensorFlow model.", SortOrder = 15)]
+            [Argument(ArgumentType.AtMostOnce, HelpText = "Retrain TensorFlow model.", SortOrder = 16)]
             public bool ReTrain = false;
         }
 
@@ -300,9 +306,9 @@ private void CheckParameters(Arguments args)
             if (Session.Graph[args.OptimizationOperation] == null)
                 throw _host.ExceptParam(nameof(args.OptimizationOperation), $"Optimization operation '{args.OptimizationOperation}' does not exist in the model");
 
-            _host.CheckNonWhiteSpace(args.LabeLColumn, nameof(args.LabeLColumn));
-            if (Session.Graph[args.LabeLColumn] == null)
-                throw _host.ExceptParam(nameof(args.LabeLColumn), $"'{args.LabeLColumn}' does not exist in the model");
+            _host.CheckNonWhiteSpace(args.TensorFlowLabel, nameof(args.TensorFlowLabel));
+            if (Session.Graph[args.TensorFlowLabel] == null)
+                throw _host.ExceptParam(nameof(args.TensorFlowLabel), $"'{args.TensorFlowLabel}' does not exist in the model");
 
             _host.CheckNonWhiteSpace(args.SaveLocationOperation, nameof(args.SaveLocationOperation));
             if (Session.Graph[args.SaveLocationOperation] == null)
@@ -334,6 +340,33 @@ private void CheckParameters(Arguments args)
             }
         }
 
+        private (int, bool, TFDataType, TFShape) GetInputMetaData(ISchema inputSchema, string columnName, string tfNodeName, int batchSize)
+        {
+            if (!inputSchema.TryGetColumnIndex(columnName, out int inputColIndices))
+                throw _host.Except($"Column {columnName} doesn't exist");
+
+            var type = inputSchema.GetColumnType(inputColIndices);
+            var isInputVector = type.IsVector;
+
+            var tfInput = new TFOutput(Graph[tfNodeName]);
+            var tfInputType = tfInput.OutputType;
+            var tfInputShape = Graph.GetTensorShape(tfInput);
+            if (tfInputShape.NumDimensions != -1)
+            {
+                var newShape = new long[tfInputShape.NumDimensions];
+                newShape[0] = tfInputShape[0] == -1 ? batchSize : tfInputShape[0];
+
+                for (int j = 1; j < tfInputShape.NumDimensions; j++)
+                    newShape[j] = tfInputShape[j];
+                tfInputShape = new TFShape(newShape);
+            }
+
+            var expectedType = TensorFlowUtils.Tf2MlNetType(tfInputType);
+            if (type.ItemType != expectedType)
+                throw _host.ExceptSchemaMismatch(nameof(inputSchema), "input", columnName, expectedType.ToString(), type.ToString());
+
+            return (inputColIndices, isInputVector, tfInputType, tfInputShape);
+        }
         private void TrainCore(Arguments args, string model, IDataView input)
         {
             var inputsForTraining = new string[Inputs.Length + 1];
@@ -347,35 +380,18 @@ private void TrainCore(Arguments args, string model, IDataView input)
                 inputsForTraining[i] = Inputs[i];
             }
 
-            inputsForTraining[inputsForTraining.Length - 1] = args.LabeLColumn;
-
             var inputSchema = input.Schema;
-            for (int i = 0; i < inputsForTraining.Length; i++)
+            for (int i = 0; i < inputsForTraining.Length - 1; i++)
             {
-                if (!inputSchema.TryGetColumnIndex(inputsForTraining[i], out inputColIndices[i]))
-                    throw _host.Except($"Column {inputsForTraining[i]} doesn't exist");
-
-                var type = inputSchema.GetColumnType(inputColIndices[i]);
-                isInputVector[i] = type.IsVector;
-
-                var tfInput = new TFOutput(Graph[inputsForTraining[i]]);
-                tfInputTypes[i] = tfInput.OutputType;
-                tfInputShapes[i] = Graph.GetTensorShape(tfInput);
-                if (tfInputShapes[i].NumDimensions != -1)
-                {
-                    var newShape = new long[tfInputShapes[i].NumDimensions];
-                    newShape[0] = tfInputShapes[i][0] == -1 ? args.BatchSize : tfInputShapes[i][0];
-
-                    for (int j = 1; j < tfInputShapes[i].NumDimensions; j++)
-                        newShape[j] = tfInputShapes[i][j];
-                    tfInputShapes[i] = new TFShape(newShape);
-                }
-
-                var expectedType = TensorFlowUtils.Tf2MlNetType(tfInputTypes[i]);
-                if (type.ItemType != expectedType)
-                    throw _host.ExceptSchemaMismatch(nameof(inputSchema), "input", inputsForTraining[i], expectedType.ToString(), type.ToString());
+                (inputColIndices[i], isInputVector[i], tfInputTypes[i], tfInputShapes[i]) =
+                    GetInputMetaData(inputSchema, inputsForTraining[i], inputsForTraining[i],args.BatchSize);
             }
 
+            var index = inputsForTraining.Length - 1;
+            inputsForTraining[index] = args.TensorFlowLabel;
+            (inputColIndices[index], isInputVector[index], tfInputTypes[index], tfInputShapes[index]) =
+                    GetInputMetaData(inputSchema, args.LabelColumn, inputsForTraining[index], args.BatchSize);
+
             var fetchList = new List<string>();
             if (args.LossOperation != null)
                 fetchList.Add(args.LossOperation);
diff --git a/test/BaselineOutput/Common/EntryPoints/core_manifest.json b/test/BaselineOutput/Common/EntryPoints/core_manifest.json
@@ -21773,7 +21773,7 @@
           "IsNullable": false
         },
         {
-          "Name": "LabeLColumn",
+          "Name": "LabelColumn",
           "Type": "String",
           "Desc": "Training labels.",
           "Aliases": [
@@ -21782,7 +21782,19 @@
           "Required": false,
           "SortOrder": 4.0,
           "IsNullable": false,
-          "Default": "Label"
+          "Default": null
+        },
+        {
+          "Name": "TensorFlowLabel",
+          "Type": "String",
+          "Desc": "TensorFlow label node.",
+          "Aliases": [
+            "TFLabel"
+          ],
+          "Required": false,
+          "SortOrder": 5.0,
+          "IsNullable": false,
+          "Default": null
         },
         {
           "Name": "OptimizationOperation",
@@ -21792,7 +21804,7 @@
             "OptimizationOp"
           ],
           "Required": false,
-          "SortOrder": 4.0,
+          "SortOrder": 6.0,
           "IsNullable": false,
           "Default": null
         },
@@ -21804,7 +21816,7 @@
             "LossOp"
           ],
           "Required": false,
-          "SortOrder": 5.0,
+          "SortOrder": 7.0,
           "IsNullable": false,
           "Default": null
         },
@@ -21816,7 +21828,7 @@
             "MetricOp"
           ],
           "Required": false,
-          "SortOrder": 6.0,
+          "SortOrder": 8.0,
           "IsNullable": false,
           "Default": null
         },
@@ -21825,7 +21837,7 @@
           "Type": "Int",
           "Desc": "Number of samples to use for mini-batch training.",
           "Required": false,
-          "SortOrder": 7.0,
+          "SortOrder": 9.0,
           "IsNullable": false,
           "Default": 64
         },
@@ -21834,7 +21846,7 @@
           "Type": "Int",
           "Desc": "Number of training iterations.",
           "Required": false,
-          "SortOrder": 8.0,
+          "SortOrder": 10.0,
           "IsNullable": false,
           "Default": 5
         },
@@ -21843,7 +21855,7 @@
           "Type": "String",
           "Desc": "The name of the operation in the TensorFlow graph which sets optimizer learning rate (Optional).",
           "Required": false,
-          "SortOrder": 9.0,
+          "SortOrder": 11.0,
           "IsNullable": false,
           "Default": null
         },
@@ -21852,7 +21864,7 @@
           "Type": "Float",
           "Desc": "Learning rate to use during optimization.",
           "Required": false,
-          "SortOrder": 10.0,
+          "SortOrder": 12.0,
           "IsNullable": false,
           "Default": 0.01
         },
@@ -21861,7 +21873,7 @@
           "Type": "Bool",
           "Desc": "Shuffle data before each iteration.",
           "Required": false,
-          "SortOrder": 11.0,
+          "SortOrder": 13.0,
           "IsNullable": false,
           "Default": true
         },
@@ -21870,7 +21882,7 @@
           "Type": "String",
           "Desc": "Name of the input in TensorFlow graph that specifiy the location for saving/restoring models from disk.",
           "Required": false,
-          "SortOrder": 12.0,
+          "SortOrder": 14.0,
           "IsNullable": false,
           "Default": "save/Const"
         },
@@ -21879,7 +21891,7 @@
           "Type": "String",
           "Desc": "Name of the input in TensorFlow graph that specifiy the location for saving/restoring models from disk.",
           "Required": false,
-          "SortOrder": 13.0,
+          "SortOrder": 15.0,
           "IsNullable": false,
           "Default": "save/control_dependency"
         },
@@ -21888,7 +21900,7 @@
           "Type": "Bool",
           "Desc": "Retrain TensorFlow model.",
           "Required": false,
-          "SortOrder": 15.0,
+          "SortOrder": 16.0,
           "IsNullable": false,
           "Default": false
         }
diff --git a/test/Microsoft.ML.Tests/ScenariosWithDirectInstantiation/TensorflowTests.cs b/test/Microsoft.ML.Tests/ScenariosWithDirectInstantiation/TensorflowTests.cs