dotnet
diff --git a/‎machine-learning/tutorials/SentimentAnalysis/Program.cs‎
Lines changed: 164 additions & 80 deletions b/‎machine-learning/tutorials/SentimentAnalysis/Program.cs‎
Lines changed: 164 additions & 80 deletions
diff --git a/‎machine-learning/tutorials/SentimentAnalysis/SentimentAnalysis.csproj‎
Lines changed: 4 additions & 1 deletion b/‎machine-learning/tutorials/SentimentAnalysis/SentimentAnalysis.csproj‎
Lines changed: 4 additions & 1 deletion
diff --git a/‎machine-learning/tutorials/SentimentAnalysis/SentimentData.cs‎
Lines changed: 8 additions & 2 deletions b/‎machine-learning/tutorials/SentimentAnalysis/SentimentData.cs‎
Lines changed: 8 additions & 2 deletions
@@ -3,102 +3,126 @@
 using System.Collections.Generic;
 using System.IO;
 using System.Linq;
-using System.Threading.Tasks;
-using Microsoft.ML.Legacy;
-using Microsoft.ML.Legacy.Models;
-using Microsoft.ML.Legacy.Data;
-using Microsoft.ML.Legacy.Transforms;
-using Microsoft.ML.Legacy.Trainers;
+using Microsoft.ML;
+using Microsoft.ML.Core.Data;
 using Microsoft.ML.Runtime.Api;
+using Microsoft.ML.Runtime.Data;
+using Microsoft.ML.Transforms.Text;
 // </Snippet1>
 
 namespace SentimentAnalysis
 {
     class Program
     {
         // <Snippet2>
-        static readonly string _dataPath = Path.Combine(Environment.CurrentDirectory, "Data", "wikipedia-detox-250-line-data.tsv");
+        static readonly string _trainDataPath = Path.Combine(Environment.CurrentDirectory, "Data", "wikipedia-detox-250-line-data.tsv");
         static readonly string _testDataPath = Path.Combine(Environment.CurrentDirectory, "Data", "wikipedia-detox-250-line-test.tsv");
-        static readonly string _modelpath = Path.Combine(Environment.CurrentDirectory, "Data", "Model.zip");
+        static readonly string _modelPath = Path.Combine(Environment.CurrentDirectory, "Data", "Model.zip");
+        static TextLoader _textLoader;
         // </Snippet2>
 
-        static async Task Main(string[] args)
+        static void Main(string[] args)
         {
+            // Create ML.NET context/local environment - allows you to add steps in order to keep everything together 
+            // during the learning process.  
+            //Create ML Context with seed for repeatable/deterministic results
             // <Snippet3>
-            var model = await Train();
+            MLContext mlContext = new MLContext(seed: 0);
             // </Snippet3>
 
-            // <Snippet12>
-            Evaluate(model);
-            // </Snippet12>
-            
-            // <Snippet17>
-            Predict(model);
-            // </Snippet17>
-        }
+            // The TextLoader loads a dataset with comments and corresponding positive or negative sentiment.
+            // When you create a loader, you specify the schema by passing a class to the loader containing
+            // all the column names and their types. This is used to create the model, and train it. 
+            // Initialize our TextLoader
+            // <Snippet4>
+            _textLoader = mlContext.Data.TextReader(new TextLoader.Arguments()
+                                                {
+                                                    Separator = "tab",
+                                                    HasHeader = true,
+                                                    Column = new[]
+                                                                {
+                                                                  new TextLoader.Column("Label", DataKind.Bool, 0),
+                                                                  new TextLoader.Column("SentimentText", DataKind.Text, 1)
+                                                                }
+                                                }
+            );
+            // </Snippet4>
 
-        public static async Task<PredictionModel<SentimentData, SentimentPrediction>> Train()
-        {
-            // LearningPipeline allows you to add steps in order to keep everything together 
-            // during the learning process.  
             // <Snippet5>
-            var pipeline = new LearningPipeline();
+            var model = Train(mlContext, _trainDataPath);
             // </Snippet5>
 
-            // The TextLoader loads a dataset with comments and corresponding postive or negative sentiment. 
-            // When you create a loader, you specify the schema by passing a class to the loader containing
-            // all the column names and their types. This is used to create the model, and train it. 
+            // <Snippet11>
+            Evaluate(mlContext, model);
+            // </Snippet11>
+            
+            // <Snippet16>
+            Predict(mlContext, model);
+            // </Snippet16>
+
+            // <Snippet25>
+            PredictWithModelLoadedFromFile(mlContext);
+            // </Snippet25>
+
+            Console.WriteLine();
+            Console.WriteLine("=============== End of process ===============");
+        }
+
+        public static ITransformer Train(MLContext mlContext, string dataPath)
+        {
+            //Note that this case, loading your training data from a file, 
+            //is the easiest way to get started, but ML.NET also allows you 
+            //to load data from databases or in-memory collections.
             // <Snippet6>
-            pipeline.Add(new TextLoader(_dataPath).CreateFrom<SentimentData>());
+            IDataView dataView =_textLoader.Read(dataPath);
             // </Snippet6>
 
-            // TextFeaturizer is a transform that is used to featurize an input column. 
-            // This is used to format and clean the data.
+            // Create a flexible pipeline (composed of a chain of estimators) for creating/training the model.
+            // This is used to format and clean the data.  
+            // Convert the text column to numeric vectors (Features column) 
             // <Snippet7>
-            pipeline.Add(new TextFeaturizer("Features", "SentimentText"));
-            //</Snippet7>
+            var pipeline = mlContext.Transforms.Text.FeaturizeText("SentimentText", "Features")
+             //</Snippet7>
 
-            // Adds a FastTreeBinaryClassifier, the decision tree learner for this project, and 
-            // three hyperparameters to be used for tuning decision tree performance.
-            // <Snippet8>
-            pipeline.Add(new FastTreeBinaryClassifier() { NumLeaves = 50, NumTrees = 50, MinDocumentsInLeafs = 20 });
+            // Adds a FastTreeBinaryClassificationTrainer, the decision tree learner for this project  
+            // <Snippet8> 
+                    .Append(mlContext.BinaryClassification.Trainers.FastTree(numLeaves: 50, numTrees: 50, minDatapointsInLeafs: 20));
             // </Snippet8>
 
-            // Train the pipeline based on the dataset that has been loaded, transformed.
+            // Create and train the model based on the dataset that has been loaded, transformed.
             // <Snippet9>
-            PredictionModel<SentimentData, SentimentPrediction> model =
-                pipeline.Train<SentimentData, SentimentPrediction>();
+            Console.WriteLine("=============== Create and Train the Model ===============");
+            var model = pipeline.Fit(dataView);
+            Console.WriteLine("=============== End of training ===============");
+            Console.WriteLine();
             // </Snippet9>
 
-            // Saves the model we trained to a zip file.
-            // <Snippet10>
-            await model.WriteAsync(_modelpath);
-            // </Snippet10>
-
             // Returns the model we trained to use for evaluation.
-            // <Snippet11>
+            // <Snippet10>
             return model;
-            // </Snippet11>
+            // </Snippet10>
         }
 
-        public static void Evaluate(PredictionModel<SentimentData, SentimentPrediction> model)
+        public static void Evaluate(MLContext mlContext, ITransformer model)
         {
-            // Evaluates.
+            // Evaluate the model and show accuracy stats
+            // Load evaluation/test data
+            // <Snippet12>
+            IDataView dataView = _textLoader.Read(_testDataPath);
+            // </Snippet12>
+
+            //Take the data in, make transformations, output the data. 
             // <Snippet13>
-            var testData = new TextLoader(_testDataPath).CreateFrom<SentimentData>();
+            Console.WriteLine("=============== Evaluating Model accuracy with Test data===============");
+            var predictions = model.Transform(dataView);
             // </Snippet13>
 
-            // BinaryClassificationEvaluator computes the quality metrics for the PredictionModel
-            // using the specified data set.
+            // BinaryClassificationContext.Evaluate returns a BinaryClassificationEvaluator.CalibratedResult
+            // that contains the computed overall metrics.
             // <Snippet14>
-            var evaluator = new BinaryClassificationEvaluator();
+            var metrics = mlContext.BinaryClassification.Evaluate(predictions, "Label");
             // </Snippet14>
 
-            // BinaryClassificationMetrics contains the overall metrics computed by binary classification evaluators.
-            // <Snippet15>
-            BinaryClassificationMetrics metrics = evaluator.Evaluate(model, testData);
-            // </Snippet15>
-
             // The Accuracy metric gets the accuracy of a classifier, which is the proportion 
             // of correct predictions in the test set.
 
@@ -111,57 +135,117 @@ public static void Evaluate(PredictionModel<SentimentData, SentimentPrediction>
             // The F1 score is the harmonic mean of precision and recall:
             //  2 * precision * recall / (precision + recall).
 
-            // <Snippet16>
+            // <Snippet15>
             Console.WriteLine();
-            Console.WriteLine("PredictionModel quality metrics evaluation");
-            Console.WriteLine("------------------------------------------");
+            Console.WriteLine("Model quality metrics evaluation");
+            Console.WriteLine("--------------------------------");
             Console.WriteLine($"Accuracy: {metrics.Accuracy:P2}");
             Console.WriteLine($"Auc: {metrics.Auc:P2}");
             Console.WriteLine($"F1Score: {metrics.F1Score:P2}");
-            // </Snippet16>
+            Console.WriteLine("=============== End of model evaluation ===============");
+            //</Snippet15>
+
+            // Save the new model to .ZIP file
+            // <Snippet23>
+            SaveModelAsFile(mlContext, model);
+            // </Snippet23>
         }
 
-        public static void Predict(PredictionModel<SentimentData, SentimentPrediction> model)
+        private static void Predict(MLContext mlContext, ITransformer model)
         {
-            // Adds some comments to test the trained model's predictions.
+            // <Snippet17>
+            var predictionFunction = model.MakePredictionFunction<SentimentData, SentimentPrediction>(mlContext);
+            // </Snippet17>
+
             // <Snippet18>
+            SentimentData sampleStatement = new SentimentData
+            {
+                SentimentText = "This is a very rude movie"
+            };
+            // </Snippet18>
+
+            // <Snippet19>
+            var resultprediction = predictionFunction.Predict(sampleStatement);
+            // </Snippet19>
+            // <Snippet20>
+            Console.WriteLine();
+            Console.WriteLine("=============== Prediction Test of model with a single sample and test dataset ===============");
+
+            Console.WriteLine();
+            Console.WriteLine($"Sentiment: {sampleStatement.SentimentText} | Prediction: {(Convert.ToBoolean(resultprediction.Prediction) ? "Toxic" : "Not Toxic")} | Probability: {resultprediction.Probability} ");
+            Console.WriteLine("=============== End of Predictions ===============");
+            Console.WriteLine();
+            // </Snippet20>
+        }
+
+        public static void PredictWithModelLoadedFromFile(MLContext mlContext)
+        {
+            // Adds some comments to test the trained model's predictions.
+            // <Snippet26>
             IEnumerable<SentimentData> sentiments = new[]
             {
                 new SentimentData
                 {
-                    SentimentText = "Please refrain from adding nonsense to Wikipedia."
+                    SentimentText = "This is a very rude movie"
                 },
                 new SentimentData
                 {
                     SentimentText = "He is the best, and the article should say that."
                 }
             };
-            // </Snippet18>
+            // </Snippet26>
 
-            // Use the model to predict the positive 
-            // or negative sentiment of the comment data.
-            // <Snippet19>
-            IEnumerable<SentimentPrediction> predictions = model.Predict(sentiments);
-            // </Snippet19>
+            // <Snippet27>
+            ITransformer loadedModel;
+            using (var stream = new FileStream(_modelPath, FileMode.Open, FileAccess.Read, FileShare.Read))
+            {
+                loadedModel = mlContext.Model.Load(stream);
+            }
+            // </Snippet27>
+
+            // <Snippet28>
+            // Wrap the sample comments in a streaming data view and transform them with the loaded model
+            var sentimentStreamingDataView = mlContext.CreateStreamingDataView(sentiments);
+            var predictions = loadedModel.Transform(sentimentStreamingDataView);
+            
+            // Use the model to predict whether comment data is toxic (1) or nice (0).
+            var predictedResults = predictions.AsEnumerable<SentimentPrediction>(mlContext, reuseRowObject: false);
+            // </Snippet28>
+
+            // <Snippet29>
+            Console.WriteLine();
+
+            Console.WriteLine("=============== Prediction Test of loaded model with a multiple samples ===============");
+            // </Snippet29>
 
-            // <Snippet20>
             Console.WriteLine();
-            Console.WriteLine("Sentiment Predictions");
-            Console.WriteLine("---------------------");
-            // </Snippet20>
 
             // Builds pairs of (sentiment, prediction)
-            // <Snippet21>
-            var sentimentsAndPredictions = sentiments.Zip(predictions, (sentiment, prediction) => (sentiment, prediction));
-            // </Snippet21>
+            // <Snippet30>
+            var sentimentsAndPredictions = sentiments.Zip(predictedResults, (sentiment, prediction) => (sentiment, prediction));
+            // </Snippet30>
 
-            // <Snippet22>
+            // <Snippet31>
             foreach (var item in sentimentsAndPredictions)
             {
-                Console.WriteLine($"Sentiment: {item.sentiment.SentimentText} | Prediction: {(item.prediction.Sentiment ? "Negative" : "Positive")}");
+                Console.WriteLine($"Sentiment: {item.sentiment.SentimentText} | Prediction: {(Convert.ToBoolean(item.prediction.Prediction) ? "Toxic" : "Not Toxic")} | Probability: {item.prediction.Probability} ");
             }
-            Console.WriteLine();
-            // </Snippet22>          
+            Console.WriteLine("=============== End of predictions ===============");
+
+            // </Snippet31>          
+        }
+
+        // Saves the model we trained to a zip file.
+
+        private static void SaveModelAsFile(MLContext mlContext, ITransformer model)
+        {
+            // <Snippet24> 
+            using (var fs = new FileStream(_modelPath, FileMode.Create, FileAccess.Write, FileShare.Write))
+                mlContext.Model.Save(model,fs);
+            // </Snippet24>
+
+            Console.WriteLine("The model is saved to {0}", _modelPath);
         }
+        
     }
 }
@@ -14,10 +14,13 @@
   </ItemGroup>
 
   <ItemGroup>
-    <PackageReference Include="Microsoft.ML" Version="0.6.0" />
+    <PackageReference Include="Microsoft.ML" Version="0.7.0" />
   </ItemGroup>
 
   <ItemGroup>
+    <None Update="Data\wikipedia-detox-250-line-all.tsv">
+      <CopyToOutputDirectory>PreserveNewest</CopyToOutputDirectory>
+    </None>
     <None Update="Data\wikipedia-detox-250-line-data.tsv">
       <CopyToOutputDirectory>PreserveNewest</CopyToOutputDirectory>
     </None>
 
@@ -16,7 +16,13 @@ public class SentimentData
     public class SentimentPrediction
     {
         [ColumnName("PredictedLabel")]
-        public bool Sentiment;
+        public bool Prediction { get; set; }
+
+        [ColumnName("Probability")]
+        public float Probability { get; set; }
+
+        [ColumnName("Score")]
+        public float Score { get; set; }
     }
     // </Snippet2>
-}
+}