9 references to GetUtf8Bytes
Microsoft.ML.Tokenizers (9)
Model\CodeGenTokenizer.cs (1)
1298: bytesIndex += Helpers.GetUtf8Bytes(removePrefixSpace ? specialToken.AsSpan().Slice(1) : specialToken.AsSpan(), bytes.AsSpan().Slice(bytesIndex));
Model\SentencePieceBpeModel.cs (4)
236: int bytesWritten = Helpers.GetUtf8Bytes(text.Slice(i), utf8Bytes);
536: int bytesWritten = Helpers.GetUtf8Bytes(text.Slice(i), utf8Bytes);
799: int encodedCount = Helpers.GetUtf8Bytes(text.Slice(i), utf8Bytes);
1075: int encodedCount = Helpers.GetUtf8Bytes(text.Slice(0, i + 1), utf8Bytes);
Model\SentencePieceUnigramModel.cs (1)
299: int byteCount = Helpers.GetUtf8Bytes(text, byteSpan);
Utils\DoubleArrayTrie.cs (1)
758: encodingLength = Helpers.GetUtf8Bytes(pair.Key.AsSpan(), bytes);
Utils\OrdinalUtf8StringComparer.cs (2)
73: xLen = Helpers.GetUtf8Bytes(x.AsSpan(i), buffer1);
74: yLen = Helpers.GetUtf8Bytes(y.AsSpan(i), buffer2);