// TrainContext.cs

// Licensed to the .NET Foundation under one or more agreements.
// The .NET Foundation licenses this file to you under the MIT license.
// See the LICENSE file in the project root for more information.
 
using Microsoft.ML.Data;
using Microsoft.ML.Runtime;
 
namespace Microsoft.ML;
 
/// <summary>
/// Holds information relevant to trainers. Instances of this class are meant to be constructed and passed
/// into <see cref="ITrainer{TPredictor}.Train(TrainContext)"/> or <see cref="ITrainer.Train(TrainContext)"/>.
/// This holds at least a training set, as well as optionally a validation set, a test set, and an
/// initial predictor.
/// </summary>
[BestFriend]
internal sealed class TrainContext
{
    /// <summary>
    /// The training set. Cannot be <c>null</c>.
    /// </summary>
    public RoleMappedData TrainingSet { get; }

    /// <summary>
    /// The validation set. Can be <c>null</c>. Note that passing a non-<c>null</c> validation set into
    /// a trainer that does not support validation sets should not be considered an error condition. It
    /// should simply be ignored in that case.
    /// </summary>
    public RoleMappedData ValidationSet { get; }

    /// <summary>
    /// The test set. Can be <c>null</c>. Its uses are very similar to those of the validation set, but it
    /// should not directly or indirectly affect the training process. One major difference between the
    /// validation set and the test set is that the validation set can affect the training process by, for
    /// example, early stopping. Note that early stopping is a technique which terminates the training
    /// process once the scores computed on the validation set start getting worse.
    /// </summary>
    public RoleMappedData TestSet { get; }

    /// <summary>
    /// The initial predictor, for incremental training. Can be <c>null</c>. Note that if a
    /// <see cref="ITrainer"/> implementor does not support incremental training, then it can ignore it
    /// similarly to how one would ignore <see cref="ValidationSet"/>. However, if the trainer does support
    /// incremental training and there is something wrong with a non-<c>null</c> value of this, then the
    /// trainer ought to throw an exception.
    /// </summary>
    public IPredictor InitialPredictor { get; }

    /// <summary>
    /// Constructor, given a training set and optional other arguments.
    /// </summary>
    /// <param name="trainingSet">Will set <see cref="TrainingSet"/> to this value. This must be specified;
    /// it is validated with <c>Contracts.CheckValue</c>.</param>
    /// <param name="validationSet">Will set <see cref="ValidationSet"/> to this value if specified.</param>
    /// <param name="testSet">Will set <see cref="TestSet"/> to this value if specified.</param>
    /// <param name="initialPredictor">Will set <see cref="InitialPredictor"/> to this value if specified.</param>
    public TrainContext(RoleMappedData trainingSet, RoleMappedData validationSet = null, RoleMappedData testSet = null, IPredictor initialPredictor = null)
    {
        Contracts.CheckValue(trainingSet, nameof(trainingSet));

        // Every optional argument gets the same "value or null" contract annotation, so that
        // none of them looks accidentally unchecked next to its siblings.
        Contracts.CheckValueOrNull(validationSet);
        Contracts.CheckValueOrNull(testSet);
        Contracts.CheckValueOrNull(initialPredictor);

        // REVIEW: Should there be code here to ensure that the role mappings between the data sets are
        // compatible? That is, all the role mappings are the same and the columns between them have
        // identical types?

        TrainingSet = trainingSet;
        ValidationSet = validationSet;
        TestSet = testSet;
        InitialPredictor = initialPredictor;
    }
}
// File: Prediction\TrainContext.cs	Web Access
// Project: src\src\Microsoft.ML.Core\Microsoft.ML.Core.csproj (Microsoft.ML.Core)