6 overrides of Decode
Microsoft.ML.Tokenizers (6)
Model\BPETokenizer.cs (1)
616
public override string
Decode
(IEnumerable<int> ids) => Decode(ids, considerSpecialTokens: true);
Model\CodeGenTokenizer.cs (1)
1234
public override string
Decode
(IEnumerable<int> ids) => Decode(ids, hasPrefixSpace: AddPrefixSpace, considerSpecialTokens: false);
Model\EnglishRobertaTokenizer.cs (1)
764
public override string
Decode
(IEnumerable<int> ids)
Model\SentencePieceTokenizer.cs (1)
1530
public override string
Decode
(IEnumerable<int> ids)
Model\TiktokenTokenizer.cs (1)
795
public override string
Decode
(IEnumerable<int> ids)
Model\WordPieceTokenizer.cs (1)
671
public override string
Decode
(IEnumerable<int> ids) => Decode(ids, skipSpecialTokens: false);
22 references to Decode
Microsoft.ML.Tokenizers.Tests (21)
BpeTests.cs (1)
266
Assert.Equal(decodedTokens, tokenizer.
Decode
(encodingIds));
CodeGenTests.cs (2)
254
Assert.Equal(text, tokenizer.
Decode
(ids));
257
Assert.Equal(text, tokenizer.
Decode
(ids));
EnglishRobertaTests.cs (1)
280
Assert.Equal(expectedDecodedString, tokenizer.
Decode
(encodingIds));
LlamaTests.cs (5)
248
Assert.Equal(input, llamaTokenizer.
Decode
(ids));
270
Assert.Equal(input, llamaTokenizer.
Decode
(extractedIds));
280
Assert.Equal(input, llamaTokenizer.
Decode
(extractedIds));
290
Assert.Equal(input, llamaTokenizer.
Decode
(extractedIds));
347
Assert.Throws<ArgumentNullException>(() => llamaTokenizer.
Decode
(null!));
TiktokenTests.cs (11)
140
Assert.Equal(text, tokenizer.
Decode
(encoded)!);
193
Assert.Equal(text, GPT4.
Decode
(encoded));
224
Assert.Equal(text, gpt4Tokenizer.
Decode
(encoded));
236
Assert.Equal(text, GPT4.
Decode
(encoded));
271
Assert.Equal(text, GPT4.
Decode
(encoded));
297
Assert.Equal(text, GPT4o.
Decode
(encoded));
305
Assert.Equal(text, GPT4o.
Decode
(encoded));
333
Assert.Equal(text, GPT2.
Decode
(encoded));
352
Assert.Equal(text, P50kBase.
Decode
(encoded));
371
Assert.Equal(text, P50kEdit.
Decode
(encoded));
390
Assert.Equal(text, R50kBase.
Decode
(encoded));
TokenizerTests.cs (1)
26
tokenizer.
Decode
(Enumerable.Repeat("abcdefghijklmnopqrstuvwxyz", 100).SelectMany(s => s.Select(c => c - 'a'))));
Microsoft.ML.TorchSharp (1)
Roberta\QATrainer.cs (1)
927
outputCache.PredictedAnswersBuffer[index] = new ReadOnlyMemory<char>(_parent.Tokenizer.
Decode
(_parent.Tokenizer.RobertaModel().ConvertOccurrenceRanksToIds(contextIds).ToArray().AsSpan(predictStart - questionLength - 2, predictEnd - predictStart).ToArray()).Trim().ToCharArray());