3 overrides of PreTokenize
Microsoft.ML.Tokenizers (2)
PreTokenizer\RegexPreTokenizer.cs (1)
48
public override IEnumerable<(int Offset, int Length)>
PreTokenize
(string text)
PreTokenizer\RobertaPreTokenizer.cs (1)
25
public override IEnumerable<(int Offset, int Length)>
PreTokenize
(string text)
Microsoft.ML.Tokenizers.Tests (1)
PreTokenizerTests.cs (1)
116
public override IEnumerable<(int Offset, int Length)>
PreTokenize
(string text)
6 references to PreTokenize
Microsoft.ML.Tokenizers (3)
Tokenizer.cs (3)
450
splits = preTokenizer.
PreTokenize
(normalizedString);
472
splits = preTokenizer.
PreTokenize
(normalizedString);
481
splits = preTokenizer.
PreTokenize
(text);
Microsoft.ML.Tokenizers.Tests (2)
PreTokenizerTests.cs (2)
60
(int Offset, int Length)[] splitParts = preTokenizer.
PreTokenize
(text).ToArray<(int Offset, int Length)>();
73
Assert.Empty(PreTokenizer.CreateWordOrNonWordPreTokenizer().
PreTokenize
((string)null!));
Microsoft.ML.TorchSharp (1)
NasBert\NerTrainer.cs (1)
379
var pre = tokenizer.PreTokenizer.
PreTokenize
(sentence);