13 instantiations of SentencePieceNormalizer
Microsoft.ML.Tokenizers (2)
Model\SentencePieceBaseModel.cs (2)
54
Normalizer = new
SentencePieceNormalizer
(
115
Normalizer = new
SentencePieceNormalizer
(
Microsoft.ML.Tokenizers.Tests (11)
LlamaTests.cs (11)
397
SentencePieceNormalizer normalizer = new
SentencePieceNormalizer
(removeExtraWhiteSpaces: false, addDummyPrefix: false, escapeWhiteSpaces: false, treatWhitespaceAsSuffix: false, specialTokens: null);
401
normalizer = new
SentencePieceNormalizer
(removeExtraWhiteSpaces: true, addDummyPrefix: false, escapeWhiteSpaces: false, treatWhitespaceAsSuffix: false, specialTokens: null);
405
normalizer = new
SentencePieceNormalizer
(removeExtraWhiteSpaces: true, addDummyPrefix: true, escapeWhiteSpaces: false, treatWhitespaceAsSuffix: false, specialTokens: null);
409
normalizer = new
SentencePieceNormalizer
(removeExtraWhiteSpaces: true, addDummyPrefix: true, escapeWhiteSpaces: true, treatWhitespaceAsSuffix: false, specialTokens: null);
413
normalizer = new
SentencePieceNormalizer
(removeExtraWhiteSpaces: false, addDummyPrefix: true, escapeWhiteSpaces: true, treatWhitespaceAsSuffix: false, specialTokens: null);
417
normalizer = new
SentencePieceNormalizer
(removeExtraWhiteSpaces: true, addDummyPrefix: true, escapeWhiteSpaces: true, treatWhitespaceAsSuffix: true, specialTokens: null);
421
normalizer = new
SentencePieceNormalizer
(removeExtraWhiteSpaces: true, addDummyPrefix: false, escapeWhiteSpaces: true, treatWhitespaceAsSuffix: true, specialTokens: null);
425
normalizer = new
SentencePieceNormalizer
(removeExtraWhiteSpaces: false, addDummyPrefix: true, escapeWhiteSpaces: true, treatWhitespaceAsSuffix: true, specialTokens: null);
429
normalizer = new
SentencePieceNormalizer
(removeExtraWhiteSpaces: false, addDummyPrefix: true, escapeWhiteSpaces: false, treatWhitespaceAsSuffix: true, specialTokens: null);
433
normalizer = new
SentencePieceNormalizer
(removeExtraWhiteSpaces: false, addDummyPrefix: true, escapeWhiteSpaces: true, treatWhitespaceAsSuffix: false, specialTokens: (_llamaPhi3Tokenizer as LlamaTokenizer)!.SpecialTokens);
441
normalizer = new
SentencePieceNormalizer
(removeExtraWhiteSpaces: false, addDummyPrefix: true, escapeWhiteSpaces: true, treatWhitespaceAsSuffix: true, specialTokens: (_llamaPhi3Tokenizer as LlamaTokenizer)!.SpecialTokens);
8 references to SentencePieceNormalizer
Microsoft.ML.Tokenizers (6)
Model\SentencePieceBaseModel.cs (5)
161
public
SentencePieceNormalizer
? Normalizer { get; }
226
char prefixSuffixChar = EscapeWhiteSpaces ?
SentencePieceNormalizer
.DummyPrefix : ' ';
318
Debug.Assert(sb[suffixIndex] ==
SentencePieceNormalizer
.DummyPrefix);
334
return EscapeWhiteSpaces ? sb.ToString(
SentencePieceNormalizer
.DummyPrefix, ' ') : sb.ToString();
451
char prefixSuffixChar = EscapeWhiteSpaces ?
SentencePieceNormalizer
.DummyPrefix : ' ';
Normalizer\SentencePieceNormalizer.cs (1)
463
static void AddWhiteSpace(
SentencePieceNormalizer
normalizer, Span<byte> normalized, ref int normalizedIndex, ref byte[]? poolArray)
Microsoft.ML.Tokenizers.Tests (2)
LlamaTests.cs (2)
75
propertyInfo = typeof(
SentencePieceNormalizer
).GetProperty("TreatWhitespaceAsSuffix", BindingFlags.Instance | BindingFlags.NonPublic | BindingFlags.Public);
397
SentencePieceNormalizer
normalizer = new SentencePieceNormalizer(removeExtraWhiteSpaces: false, addDummyPrefix: false, escapeWhiteSpaces: false, treatWhitespaceAsSuffix: false, specialTokens: null);