eerhardt
diff --git a/‎src/Microsoft.ML.Core/EntryPoints/ModuleArgs.cs‎
Lines changed: 5 additions & 0 deletions b/‎src/Microsoft.ML.Core/EntryPoints/ModuleArgs.cs‎
Lines changed: 5 additions & 0 deletions
diff --git a/‎src/Microsoft.ML.Core/EntryPoints/ModuleCatalog.cs‎
Lines changed: 2 additions & 0 deletions b/‎src/Microsoft.ML.Core/EntryPoints/ModuleCatalog.cs‎
Lines changed: 2 additions & 0 deletions
diff --git a/‎src/Microsoft.ML.FastTree/FastTree.cs‎
Lines changed: 25 additions & 0 deletions b/‎src/Microsoft.ML.FastTree/FastTree.cs‎
Lines changed: 25 additions & 0 deletions
diff --git a/‎src/Microsoft.ML.FastTree/FastTreeClassification.cs‎
Lines changed: 5 additions & 1 deletion b/‎src/Microsoft.ML.FastTree/FastTreeClassification.cs‎
Lines changed: 5 additions & 1 deletion
diff --git a/‎src/Microsoft.ML.FastTree/FastTreeRanking.cs‎
Lines changed: 5 additions & 1 deletion b/‎src/Microsoft.ML.FastTree/FastTreeRanking.cs‎
Lines changed: 5 additions & 1 deletion
diff --git a/‎src/Microsoft.ML.FastTree/FastTreeRegression.cs‎
Lines changed: 5 additions & 1 deletion b/‎src/Microsoft.ML.FastTree/FastTreeRegression.cs‎
Lines changed: 5 additions & 1 deletion
diff --git a/‎src/Microsoft.ML.FastTree/FastTreeTweedie.cs‎
Lines changed: 9 additions & 3 deletions b/‎src/Microsoft.ML.FastTree/FastTreeTweedie.cs‎
Lines changed: 9 additions & 3 deletions
diff --git a/‎src/Microsoft.ML.FastTree/RandomForest.cs‎
Lines changed: 22 additions & 0 deletions b/‎src/Microsoft.ML.FastTree/RandomForest.cs‎
Lines changed: 22 additions & 0 deletions
diff --git a/‎src/Microsoft.ML.FastTree/RandomForestClassification.cs‎
Lines changed: 5 additions & 1 deletion b/‎src/Microsoft.ML.FastTree/RandomForestClassification.cs‎
Lines changed: 5 additions & 1 deletion
diff --git a/‎src/Microsoft.ML.FastTree/RandomForestRegression.cs‎
Lines changed: 5 additions & 1 deletion b/‎src/Microsoft.ML.FastTree/RandomForestRegression.cs‎
Lines changed: 5 additions & 1 deletion
@@ -527,6 +527,11 @@ public sealed class EntryPointAttribute : Attribute
             /// Short name of the Entry Point
             /// </summary>
             public string ShortName { get; set; }
+
+            /// <summary>
+            /// Remarks on the Entry Point, for more extensive XML documentation on the C# API
+            /// </summary>
+            public string Remarks { get; set; }
         }
 
         /// <summary>
 
@@ -44,6 +44,7 @@ public sealed class EntryPointInfo
             public readonly string Description;
             public readonly string ShortName;
             public readonly string FriendlyName;
+            public readonly string Remarks;
             public readonly MethodInfo Method;
             public readonly Type InputType;
             public readonly Type OutputType;
@@ -63,6 +64,7 @@ internal EntryPointInfo(IExceptionContext ectx, MethodInfo method,
                 Method = method;
                 ShortName = attribute.ShortName;
                 FriendlyName = attribute.UserName;
+                Remarks = attribute.Remarks;
                 ObsoleteAttribute = obsoleteAttribute;
 
                 // There are supposed to be 2 parameters, env and input for non-macro nodes.
 
@@ -82,6 +82,31 @@ public abstract class FastTreeTrainerBase<TArgs, TPredictor> :
 
         protected string InnerArgs => CmdParser.GetSettings(Host, Args, new TArgs());
 
+        internal const string Remarks = @"<remarks>
+<para>FastTrees is an efficient implementation of the <a href='https://arxiv.org/abs/1505.01866'>MART</a> gradient boosting algorithm. 
+Gradient boosting is a machine learning technique for regression problems. 
+It builds each regression tree in a step-wise fashion, using a predefined loss function to measure the error for each step and corrects for it in the next. 
+So this prediction model is actually an ensemble of weaker prediction models. In regression problems, boosting builds a series of such trees in a step-wise fashion and then selects the optimal tree using an arbitrary differentiable loss function.
+</para>
+<para>
+MART learns an ensemble of regression trees, each of which is a decision tree with scalar values in its leaves. 
+A decision (or regression) tree is a binary tree-like flow chart, where at each interior node one decides which of the two child nodes to continue to based on one of the feature values from the input. 
+At each leaf node, a value is returned. In the interior nodes, the decision is based on the test 'x <= v' where x is the value of the feature in the input sample and v is one of the possible values of this feature. 
+The functions that can be produced by a regression tree are all the piece-wise constant functions.
+</para>
+<para>
+The ensemble of trees is produced by computing, in each step, a regression tree that approximates the gradient of the loss function, and adding it to the previous tree with coefficients that minimize the loss of the new tree.
+The output of the ensemble produced by MART on a given instance is the sum of the tree outputs.
+</para>
+<list type='bullet'>
+<item>In case of a binary classification problem, the output is converted to a probability by using some form of calibration.</item>
+<item>In case of a regression problem, the output is the predicted value of the function.</item>
+<item>In case of a ranking problem, the instances are ordered by the output value of the ensemble.</item>
+</list>
+<a href='https://en.wikipedia.org/wiki/Gradient_boosting#Gradient_tree_boosting'>Wikipedia: Gradient boosting (Gradient tree boosting)</a>.
+<a href='http://projecteuclid.org/DPubS?service=UI&amp;version=1.0&amp;verb=Display&amp;handle=euclid.aos/1013203451'>Greedy function approximation: A gradient boosting machine</a>.
+</remarks>";
+
         public override bool NeedNormalization => false;
 
         public override bool WantCaching => false;
 
@@ -338,7 +338,11 @@ public void AdjustTreeOutputs(IChannel ch, RegressionTree tree,
 
     public static partial class FastTree
     {
-        [TlcModule.EntryPoint(Name = "Trainers.FastTreeBinaryClassifier", Desc = FastTreeBinaryClassificationTrainer.Summary, UserName = FastTreeBinaryClassificationTrainer.UserNameValue, ShortName = FastTreeBinaryClassificationTrainer.ShortName)]
+        [TlcModule.EntryPoint(Name = "Trainers.FastTreeBinaryClassifier", 
+            Desc = FastTreeBinaryClassificationTrainer.Summary, 
+            Remarks = FastTreeBinaryClassificationTrainer.Remarks, 
+            UserName = FastTreeBinaryClassificationTrainer.UserNameValue, 
+            ShortName = FastTreeBinaryClassificationTrainer.ShortName)]
         public static CommonOutputs.BinaryClassificationOutput TrainBinary(IHostEnvironment env, FastTreeBinaryClassificationTrainer.Arguments input)
         {
             Contracts.CheckValue(env, nameof(env));
 
@@ -1096,7 +1096,11 @@ public static FastTreeRankingPredictor Create(IHostEnvironment env, ModelLoadCon
 
     public static partial class FastTree
     {
-        [TlcModule.EntryPoint(Name = "Trainers.FastTreeRanker", Desc = FastTreeRankingTrainer.Summary, UserName = FastTreeRankingTrainer.UserNameValue, ShortName = FastTreeRankingTrainer.ShortName)]
+        [TlcModule.EntryPoint(Name = "Trainers.FastTreeRanker", 
+            Desc = FastTreeRankingTrainer.Summary, 
+            Remarks = FastTreeRankingTrainer.Remarks,
+            UserName = FastTreeRankingTrainer.UserNameValue, 
+            ShortName = FastTreeRankingTrainer.ShortName)]
         public static CommonOutputs.RankingOutput TrainRanking(IHostEnvironment env, FastTreeRankingTrainer.Arguments input)
         {
             Contracts.CheckValue(env, nameof(env));
 
@@ -448,7 +448,11 @@ public static FastTreeRegressionPredictor Create(IHostEnvironment env, ModelLoad
 
     public static partial class FastTree
     {
-        [TlcModule.EntryPoint(Name = "Trainers.FastTreeRegressor", Desc = FastTreeRegressionTrainer.Summary, UserName = FastTreeRegressionTrainer.UserNameValue, ShortName = FastTreeRegressionTrainer.ShortName)]
+        [TlcModule.EntryPoint(Name = "Trainers.FastTreeRegressor",
+            Desc = FastTreeRegressionTrainer.Summary, 
+            Remarks = FastTreeRegressionTrainer.Remarks, 
+            UserName = FastTreeRegressionTrainer.UserNameValue, 
+            ShortName = FastTreeRegressionTrainer.ShortName)]
         public static CommonOutputs.RegressionOutput TrainRegression(IHostEnvironment env, FastTreeRegressionTrainer.Arguments input)
         {
             Contracts.CheckValue(env, nameof(env));
 
@@ -36,8 +36,11 @@ public sealed partial class FastTreeTweedieTrainer : BoostingFastTreeTrainerBase
     {
         public const string LoadNameValue = "FastTreeTweedieRegression";
         public const string UserNameValue = "FastTree (Boosted Trees) Tweedie Regression";
-        public const string Summary = "Trains gradient boosted decision trees to fit target values using a Tweedie loss function. This learner " +
-                                        "is a generalization of Poisson, compound Poisson, and gamma regression.";
+        public const string Summary = "Trains gradient boosted decision trees to fit target values using a Tweedie loss function. This learner is a generalization of Poisson, compound Poisson, and gamma regression.";
+        new public const string Remarks = @"<remarks>
+<a href='https://en.wikipedia.org/wiki/Gradient_boosting#Gradient_tree_boosting'>Wikipedia: Gradient boosting (Gradient tree boosting)</a>
+<a href='http://projecteuclid.org/DPubS?service=UI&amp;version=1.0&amp;verb=Display&amp;handle=euclid.aos/1013203451'>Greedy function approximation: A gradient boosting machine</a>
+</remarks>";
 
         public const string ShortName = "fttweedie";
 
@@ -460,7 +463,10 @@ protected override void Map(ref VBuffer<float> src, ref float dst)
 
     public static partial class FastTree
     {
-        [TlcModule.EntryPoint(Name = "Trainers.FastTreeTweedieRegressor", Desc = FastTreeTweedieTrainer.Summary, UserName = FastTreeTweedieTrainer.UserNameValue, ShortName = FastTreeTweedieTrainer.ShortName)]
+        [TlcModule.EntryPoint(Name = "Trainers.FastTreeTweedieRegressor", 
+            Desc = FastTreeTweedieTrainer.Summary, 
+            UserName = FastTreeTweedieTrainer.UserNameValue, 
+            ShortName = FastTreeTweedieTrainer.ShortName)]
         public static CommonOutputs.RegressionOutput TrainTweedieRegression(IHostEnvironment env, FastTreeTweedieTrainer.Arguments input)
         {
             Contracts.CheckValue(env, nameof(env));
 
@@ -12,6 +12,28 @@ public abstract class RandomForestTrainerBase<TArgs, TPredictor> : FastTreeTrain
         where TArgs : FastForestArgumentsBase, new()
         where TPredictor : IPredictorProducing<Float>
     {
+        new internal const string Remarks = @"<remarks>
+Decision trees are non-parametric models that perform a sequence of simple tests on inputs. 
+This decision procedure maps them to outputs found in the training dataset whose inputs were similar to the instance being processed. 
+A decision is made at each node of the binary tree data structure based on a measure of similarity that maps each instance recursively through the branches of the tree until the appropriate leaf node is reached and the output decision returned.
+<para>Decision trees have several advantages:</para>
+<list type='bullet'>
+<item>They are efficient in both computation and memory usage during training and prediction. </item>
+<item>They can represent non-linear decision boundaries.</item>
+<item>They perform integrated feature selection and classification. </item>
+<item>They are resilient in the presence of noisy features.</item>
+</list>
+Fast forest is a random forest implementation. 
+The model consists of an ensemble of decision trees. Each tree in a decision forest outputs a Gaussian distribution by way of prediction. 
+An aggregation is performed over the ensemble of trees to find a Gaussian distribution closest to the combined distribution for all trees in the model.
+This decision forest classifier consists of an ensemble of decision trees. 
+Generally, ensemble models provide better coverage and accuracy than single decision trees. 
+Each tree in a decision forest outputs a Gaussian distribution.
+<a href='http://en.wikipedia.org/wiki/Random_forest'>Wikipedia: Random forest</a>
+<a href='http://jmlr.org/papers/volume7/meinshausen06a/meinshausen06a.pdf'>Quantile regression forest</a>
+<a href='https://blogs.technet.microsoft.com/machinelearning/2014/09/10/from-stumps-to-trees-to-forests/'>From Stumps to Trees to Forests</a>
+</remarks>";
+
         private readonly bool _quantileEnabled;
 
         protected RandomForestTrainerBase(IHostEnvironment env, TArgs args, bool quantileEnabled = false)
 
@@ -208,7 +208,11 @@ protected override void GetGradientInOneQuery(int query, int threadIndex)
 
     public static partial class FastForest
     {
-        [TlcModule.EntryPoint(Name = "Trainers.FastForestBinaryClassifier", Desc = FastForestClassification.Summary, UserName = FastForestClassification.UserNameValue, ShortName = FastForestClassification.ShortName)]
+        [TlcModule.EntryPoint(Name = "Trainers.FastForestBinaryClassifier", 
+            Desc = FastForestClassification.Summary, 
+            Remarks = FastForestClassification.Remarks, 
+            UserName = FastForestClassification.UserNameValue, 
+            ShortName = FastForestClassification.ShortName)]
         public static CommonOutputs.BinaryClassificationOutput TrainBinary(IHostEnvironment env, FastForestClassification.Arguments input)
         {
             Contracts.CheckValue(env, nameof(env));
 
@@ -280,7 +280,11 @@ public BasicImpl(Dataset trainData, Arguments args)
 
     public static partial class FastForest
     {
-        [TlcModule.EntryPoint(Name = "Trainers.FastForestRegressor", Desc = FastForestRegression.Summary, UserName = FastForestRegression.LoadNameValue, ShortName = FastForestRegression.ShortName)]
+        [TlcModule.EntryPoint(Name = "Trainers.FastForestRegressor", 
+            Desc = FastForestRegression.Summary, 
+            Remarks = FastForestRegression.Remarks,
+            UserName = FastForestRegression.LoadNameValue, 
+            ShortName = FastForestRegression.ShortName)]
         public static CommonOutputs.RegressionOutput TrainRegression(IHostEnvironment env, FastForestRegression.Arguments input)
         {
             Contracts.CheckValue(env, nameof(env));
Original file line number	Diff line number	Diff line change
`@@ -338,7 +338,11 @@ public void AdjustTreeOutputs(IChannel ch, RegressionTree tree,`
`338`	`338`
`339`	`339`	`public static partial class FastTree`
`340`	`340`	`{`
`341`		`- [TlcModule.EntryPoint(Name = "Trainers.FastTreeBinaryClassifier", Desc = FastTreeBinaryClassificationTrainer.Summary, UserName = FastTreeBinaryClassificationTrainer.UserNameValue, ShortName = FastTreeBinaryClassificationTrainer.ShortName)]`
	`341`	`+ [TlcModule.EntryPoint(Name = "Trainers.FastTreeBinaryClassifier",`
	`342`	`+ Desc = FastTreeBinaryClassificationTrainer.Summary,`
	`343`	`+ Remarks = FastTreeBinaryClassificationTrainer.Remarks,`
	`344`	`+ UserName = FastTreeBinaryClassificationTrainer.UserNameValue,`
	`345`	`+ ShortName = FastTreeBinaryClassificationTrainer.ShortName)]`
`342`	`346`	`public static CommonOutputs.BinaryClassificationOutput TrainBinary(IHostEnvironment env, FastTreeBinaryClassificationTrainer.Arguments input)`
`343`	`347`	`{`
`344`	`348`	`Contracts.CheckValue(env, nameof(env));`
Original file line number	Diff line number	Diff line change
`@@ -1096,7 +1096,11 @@ public static FastTreeRankingPredictor Create(IHostEnvironment env, ModelLoadCon`
`1096`	`1096`
`1097`	`1097`	`public static partial class FastTree`
`1098`	`1098`	`{`
`1099`		`- [TlcModule.EntryPoint(Name = "Trainers.FastTreeRanker", Desc = FastTreeRankingTrainer.Summary, UserName = FastTreeRankingTrainer.UserNameValue, ShortName = FastTreeRankingTrainer.ShortName)]`
	`1099`	`+ [TlcModule.EntryPoint(Name = "Trainers.FastTreeRanker",`
	`1100`	`+ Desc = FastTreeRankingTrainer.Summary,`
	`1101`	`+ Remarks = FastTreeRankingTrainer.Remarks,`
	`1102`	`+ UserName = FastTreeRankingTrainer.UserNameValue,`
	`1103`	`+ ShortName = FastTreeRankingTrainer.ShortName)]`
`1100`	`1104`	`public static CommonOutputs.RankingOutput TrainRanking(IHostEnvironment env, FastTreeRankingTrainer.Arguments input)`
`1101`	`1105`	`{`
`1102`	`1106`	`Contracts.CheckValue(env, nameof(env));`
Original file line number	Diff line number	Diff line change
`@@ -448,7 +448,11 @@ public static FastTreeRegressionPredictor Create(IHostEnvironment env, ModelLoad`
`448`	`448`
`449`	`449`	`public static partial class FastTree`
`450`	`450`	`{`
`451`		`- [TlcModule.EntryPoint(Name = "Trainers.FastTreeRegressor", Desc = FastTreeRegressionTrainer.Summary, UserName = FastTreeRegressionTrainer.UserNameValue, ShortName = FastTreeRegressionTrainer.ShortName)]`
	`451`	`+ [TlcModule.EntryPoint(Name = "Trainers.FastTreeRegressor",`
	`452`	`+ Desc = FastTreeRegressionTrainer.Summary,`
	`453`	`+ Remarks = FastTreeRegressionTrainer.Remarks,`
	`454`	`+ UserName = FastTreeRegressionTrainer.UserNameValue,`
	`455`	`+ ShortName = FastTreeRegressionTrainer.ShortName)]`
`452`	`456`	`public static CommonOutputs.RegressionOutput TrainRegression(IHostEnvironment env, FastTreeRegressionTrainer.Arguments input)`
`453`	`457`	`{`
`454`	`458`	`Contracts.CheckValue(env, nameof(env));`
Original file line number	Diff line number	Diff line change
`@@ -208,7 +208,11 @@ protected override void GetGradientInOneQuery(int query, int threadIndex)`
`208`	`208`
`209`	`209`	`public static partial class FastForest`
`210`	`210`	`{`
`211`		`- [TlcModule.EntryPoint(Name = "Trainers.FastForestBinaryClassifier", Desc = FastForestClassification.Summary, UserName = FastForestClassification.UserNameValue, ShortName = FastForestClassification.ShortName)]`
	`211`	`+ [TlcModule.EntryPoint(Name = "Trainers.FastForestBinaryClassifier",`
	`212`	`+ Desc = FastForestClassification.Summary,`
	`213`	`+ Remarks = FastForestClassification.Remarks,`
	`214`	`+ UserName = FastForestClassification.UserNameValue,`
	`215`	`+ ShortName = FastForestClassification.ShortName)]`
`212`	`216`	`public static CommonOutputs.BinaryClassificationOutput TrainBinary(IHostEnvironment env, FastForestClassification.Arguments input)`
`213`	`217`	`{`
`214`	`218`	`Contracts.CheckValue(env, nameof(env));`
Original file line number	Diff line number	Diff line change
`@@ -280,7 +280,11 @@ public BasicImpl(Dataset trainData, Arguments args)`
`280`	`280`
`281`	`281`	`public static partial class FastForest`
`282`	`282`	`{`
`283`		`- [TlcModule.EntryPoint(Name = "Trainers.FastForestRegressor", Desc = FastForestRegression.Summary, UserName = FastForestRegression.LoadNameValue, ShortName = FastForestRegression.ShortName)]`
	`283`	`+ [TlcModule.EntryPoint(Name = "Trainers.FastForestRegressor",`
	`284`	`+ Desc = FastForestRegression.Summary,`
	`285`	`+ Remarks = FastForestRegression.Remarks,`
	`286`	`+ UserName = FastForestRegression.LoadNameValue,`
	`287`	`+ ShortName = FastForestRegression.ShortName)]`
`284`	`288`	`public static CommonOutputs.RegressionOutput TrainRegression(IHostEnvironment env, FastForestRegression.Arguments input)`
`285`	`289`	`{`
`286`	`290`	`Contracts.CheckValue(env, nameof(env));`