13 references to BeginningOfSentenceToken
Microsoft.ML.Tokenizers.Tests (13)
LlamaTests.cs (3)
366Assert.Equal("<s>", bpe.BeginningOfSentenceToken); 665Assert.Equal(new[] { tokenizer.BeginningOfSentenceToken, kvp.Key }, encodedTokens.Select(et => et.Value).ToArray()); 838string textWithSpecialTokens = $"{tokenizer.BeginningOfSentenceToken}{text}";
UnigramTests.cs (10)
335Assert.True(writableTokens[0].Value == tokenizer.BeginningOfSentenceToken); 452string newString = $"{_unigramTokenizer.BeginningOfSentenceToken}{inputText}<pad>{inputText}{_unigramTokenizer.EndOfSentenceToken}"; 465expectedTokens[0] = _unigramTokenizerWithSpecialTokens.BeginningOfSentenceToken; 472newString = $"{_unigramTokenizerFromJson.BeginningOfSentenceToken}{inputText}<pad>{inputText}{_unigramTokenizerFromJson.EndOfSentenceToken}"; 485expectedTokens[0] = _unigramTokenizerFromJson.BeginningOfSentenceToken; 664inputText = $"{_unigramTokenizerWithSpecialTokens.BeginningOfSentenceToken}{inputText}<pad>{inputText}{_unigramTokenizerWithSpecialTokens.EndOfSentenceToken}"; 671string expectedNormalized = $"{_unigramTokenizerWithSpecialTokens.BeginningOfSentenceToken}{normalizedText}<pad>{normalizedText}{_unigramTokenizerWithSpecialTokens.EndOfSentenceToken}"; 690expectedNormalized = $"{_unigramTokenizerFromJson.BeginningOfSentenceToken}{normalizedText}<pad>{normalizedText}{_unigramTokenizerFromJson.EndOfSentenceToken}"; 805Assert.Equal("<s>", _unigramTokenizer.BeginningOfSentenceToken); 816Assert.Equal("<s>", _unigramTokenizerFromJson.BeginningOfSentenceToken);