1 write to EndOfSentenceToken
Microsoft.ML.Tokenizers (1)
Model\CodeGenTokenizer.cs (1)
143
EndOfSentenceToken
= endOfSentenceToken;
17 references to EndOfSentenceToken
Microsoft.ML.Tokenizers (10)
Model\CodeGenTokenizer.cs (10)
169
if (!string.IsNullOrEmpty(
EndOfSentenceToken
))
171
if (!_vocab.TryGetValue(
EndOfSentenceToken
!, out (int endOfSentenceId, string token) value))
173
throw new ArgumentException($"The end of sentence token '{
EndOfSentenceToken
}' is not found in the vocabulary.");
184
if (AddEndOfSentence && string.IsNullOrEmpty(
EndOfSentenceToken
))
402
tokens.Add(new EncodedToken(EndOfSentenceId.Value,
EndOfSentenceToken
!, new Range(index, index)));
1275
Helpers.AppendToBytesArray(
EndOfSentenceToken
!.AsSpan(), ref bytes, ref bytesIndex);
1402
if (
EndOfSentenceToken
!.Length > buffer.Length)
1407
EndOfSentenceToken
.AsSpan().CopyTo(buffer);
1408
buffer = buffer.Slice(
EndOfSentenceToken
.Length);
1409
charsWritten +=
EndOfSentenceToken
.Length;
Microsoft.ML.Tokenizers.Tests (7)
CodeGenTests.cs (7)
294
string targetText = $"{codeGenTokenizer.BeginningOfSentenceToken}{text}{codeGenTokenizer.
EndOfSentenceToken
}";
683
Assert.True(codeGenTokenizer.
EndOfSentenceToken
is not null);
688
tokensList.Add(codeGenTokenizer.
EndOfSentenceToken
!);
711
tokensList.Add(codeGenTokenizer.
EndOfSentenceToken
!);
823
tokensList.Add(codeGenTokenizer.
EndOfSentenceToken
!);
852
tokensList.Add(codeGenTokenizer.
EndOfSentenceToken
!);
979
Assert.Equal(DefaultSpecialToken, codeGenTokenizer.
EndOfSentenceToken
);