6 overrides of Decode
Microsoft.ML.Tokenizers (6)
Model\BPETokenizer.cs (1)
773
public override string
Decode
(IEnumerable<int> ids) => Decode(ids, considerSpecialTokens: true);
Model\CodeGenTokenizer.cs (1)
1237
public override string
Decode
(IEnumerable<int> ids) => Decode(ids, hasPrefixSpace: AddPrefixSpace, considerSpecialTokens: false);
Model\EnglishRobertaTokenizer.cs (1)
764
public override string
Decode
(IEnumerable<int> ids)
Model\SentencePieceTokenizer.cs (1)
401
public override string
Decode
(IEnumerable<int> ids) => _model.Decode(ids, considerSpecialTokens: false);
Model\TiktokenTokenizer.cs (1)
795
public override string
Decode
(IEnumerable<int> ids)
Model\WordPieceTokenizer.cs (1)
671
public override string
Decode
(IEnumerable<int> ids) => Decode(ids, skipSpecialTokens: false);
33 references to Decode
Microsoft.ML.GenAI.Core (2)
Pipeline\CausalLMPipeline.cs (2)
276
_ => this.Tokenizer.
Decode
(tokenIds.Concat(tokenIds)) ?? throw new InvalidOperationException("Failed to decode token ids"),
282
_ => this.Tokenizer.
Decode
(tokenIds) ?? throw new InvalidOperationException("Failed to decode token ids"),
Microsoft.ML.Tokenizers.Tests (30)
BpeTests.cs (1)
310
Assert.Equal(decodedTokens, tokenizer.
Decode
(encodingIds));
CodeGenTests.cs (2)
254
Assert.Equal(text, tokenizer.
Decode
(ids));
257
Assert.Equal(text, tokenizer.
Decode
(ids));
EnglishRobertaTests.cs (1)
280
Assert.Equal(expectedDecodedString, tokenizer.
Decode
(encodingIds));
LlamaTests.cs (5)
248
Assert.Equal(input, llamaTokenizer.
Decode
(ids));
270
Assert.Equal(input, llamaTokenizer.
Decode
(extractedIds));
280
Assert.Equal(input, llamaTokenizer.
Decode
(extractedIds));
290
Assert.Equal(input, llamaTokenizer.
Decode
(extractedIds));
347
Assert.Throws<ArgumentNullException>(() => llamaTokenizer.
Decode
(null!));
TiktokenTests.cs (17)
148
Assert.Equal(text, tokenizer.
Decode
(encoded)!);
201
Assert.Equal(text, GPT4.
Decode
(encoded));
232
Assert.Equal(text, gpt4Tokenizer.
Decode
(encoded));
244
Assert.Equal(text, GPT4.
Decode
(encoded));
279
Assert.Equal(text, GPT4.
Decode
(encoded));
344
Assert.Equal(text, GPT2.
Decode
(encoded));
363
Assert.Equal(text, P50kBase.
Decode
(encoded));
382
Assert.Equal(text, P50kEdit.
Decode
(encoded));
401
Assert.Equal(text, R50kBase.
Decode
(encoded));
796
Assert.Equal(text, Phi4.
Decode
(encoded));
865
string decoded = GPT4.
Decode
(ids);
871
string mixedDecoded = GPT4.
Decode
(mixedIds);
877
string boundaryDecoded = GPT4.
Decode
(boundaryIds);
883
string belowDecoded = GPT4.
Decode
(belowIds);
889
string aboveDecoded = GPT4.
Decode
(aboveIds);
908
string decodedRepeated = GPT4.
Decode
(idsRepeated);
914
string decodedMixed = GPT4.
Decode
(idsMixed);
TokenizerTests.cs (4)
20
Assert.Equal("", tokenizer.
Decode
([]));
22
Assert.Equal("hello", tokenizer.
Decode
([7, 4, 11, 11, 14]));
26
tokenizer.
Decode
(Enumerable.Repeat("abcdefghijklmnopqrstuvwxyz", 100).SelectMany(s => s.Select(c => c - 'a'))));
28
Assert.Throws<InvalidOperationException>(() => tokenizer.
Decode
([26, 27, 28, 29]));
Microsoft.ML.TorchSharp (1)
Roberta\QATrainer.cs (1)
927
outputCache.PredictedAnswersBuffer[index] = new ReadOnlyMemory<char>(_parent.Tokenizer.
Decode
(_parent.Tokenizer.RobertaModel().ConvertOccurrenceRanksToIds(contextIds).ToArray().AsSpan(predictStart - questionLength - 2, predictEnd - predictStart).ToArray()).Trim().ToCharArray());