2 instantiations of ModelProto
Microsoft.ML.Tokenizers (2)
SentencepieceModel.cs (2)
3878
private static readonly pb::MessageParser<ModelProto> _parser = new pb::MessageParser<ModelProto>(() => new
ModelProto
());
3921
return new
ModelProto
(this);
70 references to ModelProto
Microsoft.ML.Tokenizers (70)
Model\LlamaTokenizer.cs (3)
19
internal LlamaTokenizer(
ModelProto
modelProto, bool addBos, bool addEos, IReadOnlyDictionary<string, int>? addedTokens = null) : base(modelProto, addBos, addEos, addedTokens)
40
ModelProto
modelProto =
ModelProto
.Parser.ParseFrom(modelStream);
Model\SentencePieceBaseModel.cs (1)
18
internal SentencePieceBaseModel(
ModelProto
modelProto, bool addBos = false, bool addEos = false, IReadOnlyDictionary<string, int>? specialTokens = null)
Model\SentencePieceBpeModel.cs (12)
26
internal SentencePieceBpeModel(
ModelProto
modelProto, bool addBos, bool addEos, IReadOnlyDictionary<string, int>? specialTokens = null) : base(modelProto, addBos, addEos, specialTokens)
34
if (piece.Type ==
ModelProto
.Types.SentencePiece.Types.Type.Byte)
56
_vocab.Add(new StringSpanOrdinalKey(item.Token), (id, item.Score, (byte)
ModelProto
.Types.SentencePiece.Types.Type.Normal));
226
if (type != (byte)
ModelProto
.Types.SentencePiece.Types.Type.Unused)
314
if (id.Type != (byte)
ModelProto
.Types.SentencePiece.Types.Type.Unused ||
504
if (type != (byte)
ModelProto
.Types.SentencePiece.Types.Type.Unused)
619
if (id.Type != (byte)
ModelProto
.Types.SentencePiece.Types.Type.Unused ||
772
if (type != (byte)
ModelProto
.Types.SentencePiece.Types.Type.Unused)
878
if (id.Type != (byte)
ModelProto
.Types.SentencePiece.Types.Type.Unused ||
1048
if (type != (byte)
ModelProto
.Types.SentencePiece.Types.Type.Unused)
1154
if (id.Type != (byte)
ModelProto
.Types.SentencePiece.Types.Type.Unused ||
1254
if (leftId.Type == (byte)
ModelProto
.Types.SentencePiece.Types.Type.Unused)
Model\SentencePieceTokenizer.cs (3)
23
internal SentencePieceTokenizer(
ModelProto
modelProto, bool addBos, bool addEos, IReadOnlyDictionary<string, int>? specialTokens = null)
461
ModelProto
modelProto =
ModelProto
.Parser.ParseFrom(modelStream);
Model\SentencePieceUnigramModel.cs (17)
21
private readonly (string Piece, float Score,
ModelProto
.Types.SentencePiece.Types.Type Type)[] _vocabReverse;
27
public SentencePieceUnigramModel(
ModelProto
modelProto, bool addBos, bool addEos, IReadOnlyDictionary<string, int>? specialTokens = null) : base(modelProto, addBos, addEos, specialTokens)
30
_vocabReverse = new (string Piece, float Score,
ModelProto
.Types.SentencePiece.Types.Type Type)[modelProto.Pieces.Count];
37
if (modelProto.Pieces[i].Type ==
ModelProto
.Types.SentencePiece.Types.Type.Normal ||
38
modelProto.Pieces[i].Type ==
ModelProto
.Types.SentencePiece.Types.Type.UserDefined ||
39
modelProto.Pieces[i].Type ==
ModelProto
.Types.SentencePiece.Types.Type.Unused)
48
else if (modelProto.Pieces[i].Type ==
ModelProto
.Types.SentencePiece.Types.Type.Byte)
52
else if (modelProto.Pieces[i].Type ==
ModelProto
.Types.SentencePiece.Types.Type.Unknown)
55
_vocabReverse[i] = (modelProto.Pieces[i].Piece, modelProto.Pieces[i].Score,
ModelProto
.Types.SentencePiece.Types.Type.Unknown);
77
_vocabReverse[modelProto.TrainerSpec.BosId] = (modelProto.TrainerSpec.BosPiece, 0f,
ModelProto
.Types.SentencePiece.Types.Type.Control);
78
_vocabReverse[modelProto.TrainerSpec.EosId] = (modelProto.TrainerSpec.EosPiece, 0f,
ModelProto
.Types.SentencePiece.Types.Type.Control);
79
_vocabReverse[modelProto.TrainerSpec.UnkId] = (modelProto.TrainerSpec.UnkPiece, 0f,
ModelProto
.Types.SentencePiece.Types.Type.Unknown);
84
_vocabReverse[modelProto.TrainerSpec.PadId] = (modelProto.TrainerSpec.PadPiece, 0f,
ModelProto
.Types.SentencePiece.Types.Type.Control);
94
List<(string Piece, float Score,
ModelProto
.Types.SentencePiece.Types.Type Type)> vocabReverse = new(250_000);
103
vocabReverse.Add((item.Token, item.Score,
ModelProto
.Types.SentencePiece.Types.Type.Normal));
556
if (_vocabReverse[ret].Type ==
ModelProto
.Types.SentencePiece.Types.Type.Unused)
566
float score = _vocabReverse[ret].Type ==
ModelProto
.Types.SentencePiece.Types.Type.UserDefined ? length * _maxScore - 0.1f : _vocabReverse[ret].Score;
SentencepieceModel.cs (34)
104
new pbr::GeneratedClrTypeInfo(typeof(global::Sentencepiece.
ModelProto
), global::Sentencepiece.
ModelProto
.Parser, new[]{ "Pieces", "TrainerSpec", "NormalizerSpec", "SelfTestData", "DenormalizerSpec" }, null, null, null, new pbr::GeneratedClrTypeInfo[] { new pbr::GeneratedClrTypeInfo(typeof(global::Sentencepiece.
ModelProto
.Types.SentencePiece), global::Sentencepiece.
ModelProto
.Types.SentencePiece.Parser, new[]{ "Piece", "Score", "Type" }, null, new[]{ typeof(global::Sentencepiece.
ModelProto
.Types.SentencePiece.Types.Type) }, null, null)})
3873
internal sealed partial class ModelProto : pb::IExtendableMessage<
ModelProto
>
3878
private static readonly pb::MessageParser<
ModelProto
> _parser = new pb::MessageParser<
ModelProto
>(() => new ModelProto());
3880
private pb::ExtensionSet<
ModelProto
> _extensions;
3881
private pb::ExtensionSet<
ModelProto
> _Extensions { get { return _extensions; } }
3884
public static pb::MessageParser<
ModelProto
> Parser { get { return _parser; } }
3908
public ModelProto(
ModelProto
other) : this() {
3920
public
ModelProto
Clone() {
3926
private static readonly pb::FieldCodec<global::Sentencepiece.
ModelProto
.Types.SentencePiece> _repeated_pieces_codec
3927
= pb::FieldCodec.ForMessage(10, global::Sentencepiece.
ModelProto
.Types.SentencePiece.Parser);
3928
private readonly pbc::RepeatedField<global::Sentencepiece.
ModelProto
.Types.SentencePiece> pieces_ = new pbc::RepeatedField<global::Sentencepiece.
ModelProto
.Types.SentencePiece>();
3934
public pbc::RepeatedField<global::Sentencepiece.
ModelProto
.Types.SentencePiece> Pieces {
4001
return Equals(other as
ModelProto
);
4006
public bool Equals(
ModelProto
other) {
4138
public void MergeFrom(
ModelProto
other) {
4271
public TValue GetExtension<TValue>(pb::Extension<
ModelProto
, TValue> extension) {
4274
public pbc::RepeatedField<TValue> GetExtension<TValue>(pb::RepeatedExtension<
ModelProto
, TValue> extension) {
4277
public pbc::RepeatedField<TValue> GetOrInitializeExtension<TValue>(pb::RepeatedExtension<
ModelProto
, TValue> extension) {
4280
public void SetExtension<TValue>(pb::Extension<
ModelProto
, TValue> extension, TValue value) {
4283
public bool HasExtension<TValue>(pb::Extension<
ModelProto
, TValue> extension) {
4286
public void ClearExtension<TValue>(pb::Extension<
ModelProto
, TValue> extension) {
4289
public void ClearExtension<TValue>(pb::RepeatedExtension<
ModelProto
, TValue> extension) {
4316
get { return global::Sentencepiece.
ModelProto
.Descriptor.NestedTypes[0]; }
4408
private readonly static global::Sentencepiece.
ModelProto
.Types.SentencePiece.Types.Type TypeDefaultValue = global::Sentencepiece.
ModelProto
.Types.SentencePiece.Types.Type.Normal;
4410
private global::Sentencepiece.
ModelProto
.Types.SentencePiece.Types.Type type_;
4413
public global::Sentencepiece.
ModelProto
.Types.SentencePiece.Types.Type Type {
4624
Type = (global::Sentencepiece.
ModelProto
.Types.SentencePiece.Types.Type) input.ReadEnum();