1 write to ContinuingSubwordPrefix
Microsoft.ML.Tokenizers (1)
Model\WordPieceTokenizer.cs (1)
74
ContinuingSubwordPrefix
= continuingSubwordPrefix;
16 references to ContinuingSubwordPrefix
Microsoft.ML.Tokenizers (15)
Model\WordPieceTokenizer.cs (15)
378
int maxLength = MaxInputCharsPerWord +
ContinuingSubwordPrefix
.Length;
381
ContinuingSubwordPrefix
.AsSpan().CopyTo(buffer);
400
subStr.CopyTo(buffer.Slice(
ContinuingSubwordPrefix
.Length));
401
subStr = buffer.Slice(0,
ContinuingSubwordPrefix
.Length + subStr.Length);
518
int maxLength = MaxInputCharsPerWord +
ContinuingSubwordPrefix
.Length;
521
ContinuingSubwordPrefix
.AsSpan().CopyTo(buffer);
541
subStr.CopyTo(buffer.Slice(
ContinuingSubwordPrefix
.Length));
542
subStr = buffer.Slice(0,
ContinuingSubwordPrefix
.Length + subStr.Length);
749
if (token.StartsWith(
ContinuingSubwordPrefix
))
751
sb.Append(token.AsSpan().Slice(
ContinuingSubwordPrefix
.Length));
808
if (token.StartsWith(
ContinuingSubwordPrefix
, StringComparison.Ordinal))
810
if (token.Length -
ContinuingSubwordPrefix
.Length > buffer.Length)
814
token.AsSpan().Slice(
ContinuingSubwordPrefix
.Length).CopyTo(buffer);
815
buffer = buffer.Slice(token.Length -
ContinuingSubwordPrefix
.Length);
816
charsWritten += token.Length -
ContinuingSubwordPrefix
.Length;
Microsoft.ML.Tokenizers.Tests (1)
WordPieceTests.cs (1)
42
Assert.Equal("##", tokenizer.
ContinuingSubwordPrefix
);