4 writes to LowerCaseBeforeTokenization
Microsoft.ML.Tokenizers.Tests (4)
BertTokenizerTests.cs (4)
184
BertTokenizer[] bertTokenizers = [BertTokenizer.Create(vocabFile, new BertOptions {
LowerCaseBeforeTokenization
= false }),
185
BertTokenizer.Create(vocabStream, new BertOptions {
LowerCaseBeforeTokenization
= false })];
252
bertTokenizer = await BertTokenizer.CreateAsync(vocabStream, new BertOptions {
LowerCaseBeforeTokenization
= false }); // no lowercasing and no accent stripping
281
bertTokenizer = await BertTokenizer.CreateAsync(vocabStream, new BertOptions {
LowerCaseBeforeTokenization
= false, RemoveNonSpacingMarks = true }); // no lowercasing and accent stripping
3 references to LowerCaseBeforeTokenization
Microsoft.ML.Tokenizers (3)
Model\BertTokenizer.cs (3)
34
LowerCaseBeforeTokenization = options!.
LowerCaseBeforeTokenization
;
763
options.Normalizer ??= options.ApplyBasicTokenization ? new BertNormalizer(options.
LowerCaseBeforeTokenization
, options.IndividuallyTokenizeCjk, options.RemoveNonSpacingMarks) : null;
768
bool lowerCase = options.ApplyBasicTokenization && options.
LowerCaseBeforeTokenization
;