2 writes to TrainerSpec
Microsoft.ML.Tokenizers (2)
SentencepieceModel.cs (2)
4145
TrainerSpec
= new global::Sentencepiece.TrainerSpec();
4240
TrainerSpec
= new global::Sentencepiece.TrainerSpec();
43 references to TrainerSpec
Microsoft.ML.Tokenizers (43)
Model\LlamaTokenizer.cs (1)
47
if (modelProto.
TrainerSpec
.ModelType != TrainerSpec.Types.ModelType.Bpe)
Model\SentencePieceBaseModel.cs (9)
27
BeginningOfSentenceToken = modelProto.
TrainerSpec
.BosPiece ?? "<s>";
28
BeginningOfSentenceId = Math.Max(0, modelProto.
TrainerSpec
.BosId);
29
EndOfSentenceToken = modelProto.
TrainerSpec
.EosPiece ?? "</s>";
30
EndOfSentenceId = Math.Max(0, modelProto.
TrainerSpec
.EosId);
31
UnknownToken = modelProto.
TrainerSpec
.UnkPiece ?? "<unk>";
32
UnknownId = Math.Max(0, modelProto.
TrainerSpec
.UnkId);
35
TreatWhitespaceAsSuffix = modelProto.
TrainerSpec
.TreatWhitespaceAsSuffix;
36
ByteFallback = modelProto.
TrainerSpec
.ByteFallback;
58
modelProto.
TrainerSpec
.TreatWhitespaceAsSuffix,
Model\SentencePieceTokenizer.cs (2)
25
_model = modelProto.
TrainerSpec
.ModelType switch
29
_ => throw new ArgumentException($"The model type '{modelProto.
TrainerSpec
.ModelType}' is not supported.", nameof(modelProto))
Model\SentencePieceUnigramModel.cs (23)
31
if (modelProto.
TrainerSpec
.BosId >= modelProto.Pieces.Count ||
32
modelProto.
TrainerSpec
.EosId >= modelProto.Pieces.Count ||
33
modelProto.
TrainerSpec
.UnkId >= modelProto.Pieces.Count)
77
Debug.Assert(modelProto.
TrainerSpec
.UnkId >= 0);
78
Debug.Assert(modelProto.
TrainerSpec
.BosId >= 0);
79
Debug.Assert(modelProto.
TrainerSpec
.EosId >= 0);
81
_vocab[modelProto.
TrainerSpec
.UnkPiece] = modelProto.
TrainerSpec
.UnkId;
82
_vocab[modelProto.
TrainerSpec
.BosPiece] = modelProto.
TrainerSpec
.BosId;
83
_vocab[modelProto.
TrainerSpec
.EosPiece] = modelProto.
TrainerSpec
.EosId;
85
_vocabReverse[modelProto.
TrainerSpec
.BosId] = (modelProto.
TrainerSpec
.BosPiece, 0f, ModelProto.Types.SentencePiece.Types.Type.Control);
86
_vocabReverse[modelProto.
TrainerSpec
.EosId] = (modelProto.
TrainerSpec
.EosPiece, 0f, ModelProto.Types.SentencePiece.Types.Type.Control);
87
_vocabReverse[modelProto.
TrainerSpec
.UnkId] = (modelProto.
TrainerSpec
.UnkPiece, 0f, ModelProto.Types.SentencePiece.Types.Type.Unknown);
89
if (modelProto.
TrainerSpec
.PadId >= 0)
91
_vocab[modelProto.
TrainerSpec
.PadPiece] = modelProto.
TrainerSpec
.PadId;
92
_vocabReverse[modelProto.
TrainerSpec
.PadId] = (modelProto.
TrainerSpec
.PadPiece, 0f, ModelProto.Types.SentencePiece.Types.Type.Control);
SentencepieceModel.cs (8)
4014
if (!object.Equals(
TrainerSpec
, other.
TrainerSpec
)) return false;
4029
if (trainerSpec_ != null) hash ^=
TrainerSpec
.GetHashCode();
4087
output.WriteMessage(
TrainerSpec
);
4116
size += 1 + pb::CodedOutputStream.ComputeMessageSize(
TrainerSpec
);
4147
TrainerSpec
.MergeFrom(other.
TrainerSpec
);
4242
input.ReadMessage(
TrainerSpec
);