1 write to _vocab
Microsoft.ML.Tokenizers (1)
Model\SentencePieceUnigramModel.cs (1)
29: _vocab = new SortedDictionary<string, int>(OrdinalUtf8StringComparer.Instance);
8 references to _vocab
Microsoft.ML.Tokenizers (8)
Model\SentencePieceUnigramModel.cs (8)
52: _vocab.Add(piece, i);
67: ByteCodeToIdOffset = _vocab.TryGetValue("<0x00>", out int id) ? id : MaxByteId;
71: _trie = new DoubleArrayTrie(_vocab);
81: _vocab[modelProto.TrainerSpec.UnkPiece] = modelProto.TrainerSpec.UnkId;
82: _vocab[modelProto.TrainerSpec.BosPiece] = modelProto.TrainerSpec.BosId;
83: _vocab[modelProto.TrainerSpec.EosPiece] = modelProto.TrainerSpec.EosId;
91: _vocab[modelProto.TrainerSpec.PadPiece] = modelProto.TrainerSpec.PadId;
96: public override IReadOnlyDictionary<string, int> Vocabulary => new ReadOnlyDictionary<string, int>(_vocab);