34 instantiations of StringSpanOrdinalKey
Microsoft.ML.Tokenizers (34)
Model\BertTokenizer.cs (7)
39
SeparatorTokenId = vocab[new
StringSpanOrdinalKey
(options.SeparatorToken)];
42
PaddingTokenId = vocab[new
StringSpanOrdinalKey
(options.PaddingToken)];
45
ClassificationTokenId = vocab[new
StringSpanOrdinalKey
(options.ClassificationToken)];
48
MaskingTokenId = vocab[new
StringSpanOrdinalKey
(options.MaskingToken)];
778
if (!vocab.TryGetValue(new
StringSpanOrdinalKey
(kvp.Key), out int id) || id != kvp.Value)
816
if (token is null || !vocab.TryGetValue(new
StringSpanOrdinalKey
(token), out int id))
835
vocab[new
StringSpanOrdinalKey
(normalizedToken)] = id;
Model\BPETokenizer.cs (1)
259
_specialTokens = specialTokens.ToDictionary(kvp => new
StringSpanOrdinalKey
(kvp.Key), kvp => (kvp.Value, kvp.Key));
Model\CodeGenTokenizer.cs (2)
134
_specialTokens = specialTokens.ToDictionary(kvp => new
StringSpanOrdinalKey
(kvp.Key), kvp => (kvp.Value, kvp.Key));
1628
return new List<EncodedToken> { new EncodedToken(_vocab[new
StringSpanOrdinalKey
(tokenValue)].Id, tokenValue, new Range(mapping[0], mapping[0] + 1)) };
Model\EnglishRobertaTokenizer.cs (2)
961
return new List<EncodedToken> { new EncodedToken(_vocab[new
StringSpanOrdinalKey
(tokenValue)], tokenValue, new Range(indexMapping[0], indexMapping[0] + 1)) };
1050
tokens.Add(new EncodedToken(_vocab[new
StringSpanOrdinalKey
(w)], w, new Range(indexMapping[index], indexMapping[index] + w.Length)));
Model\SentencePieceTokenizer.cs (2)
51
_vocab.Add(new
StringSpanOrdinalKey
(piece.Piece), (i, piece.Score, (byte)piece.Type));
85
_specialTokens.Add(new
StringSpanOrdinalKey
(item.Key), item.Value);
Model\TiktokenTokenizer.cs (1)
247
vocab[new
StringSpanOrdinalKey
(decodedToken)] = (rank, decodedToken);
Model\WordPieceTokenizer.cs (1)
110
vocab.Add(new
StringSpanOrdinalKey
(line), lineNumber);
Utils\LruCache.cs (5)
51
if (_cache.TryGetValue(new
StringSpanOrdinalKey
(key), out LinkedListNode<KeyValuePair<string, TValue>>? cached))
78
if (_cache.TryGetValue(new
StringSpanOrdinalKey
(ptr, key.Length), out LinkedListNode<KeyValuePair<string, TValue>>? cached))
101
if (_cache.TryGetValue(new
StringSpanOrdinalKey
(key), out LinkedListNode<KeyValuePair<string, TValue>>? cached))
113
_cache.Remove(new
StringSpanOrdinalKey
(nodeToEvict!.Value.Key));
117
_cache[new
StringSpanOrdinalKey
(key)] = node;
Utils\StringSpanOrdinalKey.cs (13)
56
_left = new
StringSpanOrdinalKey
(ptr1, length1);
57
_right = new
StringSpanOrdinalKey
(ptr2, length2);
62
_left = new
StringSpanOrdinalKey
(data1);
63
_right = new
StringSpanOrdinalKey
(data2);
93
return _map.TryGetValue(new
StringSpanOrdinalKey
(key), out value!);
103
return _map.TryGetValue(new
StringSpanOrdinalKey
(ptr, key.Length), out value!);
112
_map.Remove(new
StringSpanOrdinalKey
(key));
122
_map[new
StringSpanOrdinalKey
(k)] = v;
137
new
StringSpanOrdinalKey
(reader.GetString()!);
142
public override StringSpanOrdinalKey Read(ref Utf8JsonReader reader, Type typeToConvert, JsonSerializerOptions options) => new
StringSpanOrdinalKey
(reader.GetString()!);
163
dictionary.Add(new
StringSpanOrdinalKey
(key!), (value, key!));
181
return map.TryGetValue(new
StringSpanOrdinalKey
(ptr, key.Length), out value!);
186
map.TryGetValue(new
StringSpanOrdinalKey
(key), out value!);
60 references to StringSpanOrdinalKey
Microsoft.ML.Tokenizers (60)
Model\BertTokenizer.cs (5)
28
Dictionary<
StringSpanOrdinalKey
, int> vocab,
702
(Dictionary<
StringSpanOrdinalKey
, int> vocab, Dictionary<int, string> vocabReverse) = await LoadVocabAsync(vocabStream, useAsync: true, cancellationToken).ConfigureAwait(false);
743
(Dictionary<
StringSpanOrdinalKey
, int> vocab, Dictionary<int, string> vocabReverse) = LoadVocabAsync(vocabStream, useAsync: false).GetAwaiter().GetResult();
757
Dictionary<
StringSpanOrdinalKey
, int> vocab,
814
private static void AddSpecialToken(Dictionary<
StringSpanOrdinalKey
, int> vocab, Dictionary<string, int> specialTokens, string token, bool lowerCase, Dictionary<string, int>? notNormalizedSpecialTokens = null)
Model\BPETokenizer.cs (10)
32
private readonly Dictionary<
StringSpanOrdinalKey
, (int, string)>? _specialTokens;
129
(Dictionary<
StringSpanOrdinalKey
, int>? vocab, Vec<(string, string)> merges) result = ReadModelDataAsync(vocabStream, mergesStream, useAsync: false).GetAwaiter().GetResult();
176
(Dictionary<
StringSpanOrdinalKey
, int>? vocab, Vec<(string, string)> merges) result = ReadModelDataAsync(vocabStream, mergesStream, useAsync: false).GetAwaiter().GetResult();
212
(Dictionary<
StringSpanOrdinalKey
, int>? vocab, Vec<(string, string)> merges) result = await ReadModelDataAsync(vocabStream, mergesStream, useAsync: true).ConfigureAwait(false);
230
Dictionary<
StringSpanOrdinalKey
, int>? vocab,
246
_vocab = vocab ?? new Dictionary<
StringSpanOrdinalKey
, int>();
251
foreach (KeyValuePair<
StringSpanOrdinalKey
, int> kvp in _vocab)
773
internal static async ValueTask<(Dictionary<
StringSpanOrdinalKey
, int>?, Vec<(string, string)>)> ReadModelDataAsync(Stream vocab, Stream? merges, bool useAsync, CancellationToken cancellationToken = default)
775
Dictionary<
StringSpanOrdinalKey
, int>? dic = useAsync
787
private readonly Dictionary<
StringSpanOrdinalKey
, int> _vocab;
Model\CodeGenTokenizer.cs (3)
25
private readonly Dictionary<
StringSpanOrdinalKey
, (int Id, string Token)> _vocab;
28
private readonly Dictionary<
StringSpanOrdinalKey
, (int, string)>? _specialTokens;
1765
private static Dictionary<
StringSpanOrdinalKey
, (int, string)> GetVocabulary(Stream vocabularyStream)
Model\EnglishRobertaTokenizer.cs (5)
23
private readonly Dictionary<
StringSpanOrdinalKey
, int> _vocab;
25
private readonly SortedDictionary<int,
StringSpanOrdinalKey
> _vocabReverse;
179
private static Dictionary<
StringSpanOrdinalKey
, int> GetVocabulary(Stream vocabularyStream)
181
Dictionary<
StringSpanOrdinalKey
, int>? vocab;
278
if (_vocabReverse.TryGetValue(id, out
var
value))
Model\ModelSourceGenerationContext.cs (1)
10
[JsonSerializable(typeof(Dictionary<
StringSpanOrdinalKey
, int>))]
Model\SentencePieceTokenizer.cs (3)
28
private readonly Dictionary<
StringSpanOrdinalKey
, (int Id, float Score, byte Type)> _vocab = new();
36
private readonly Dictionary<
StringSpanOrdinalKey
, int>? _specialTokens;
80
_specialTokens = new Dictionary<
StringSpanOrdinalKey
, int>();
Model\TiktokenTokenizer.cs (8)
30
private readonly Dictionary<
StringSpanOrdinalKey
, (int Id, string Token)> _vocab;
79
Dictionary<
StringSpanOrdinalKey
, (int Id, string Token)> vocab,
157
internal static async ValueTask<(Dictionary<ReadOnlyMemory<byte>, int>, Dictionary<
StringSpanOrdinalKey
, (int Id, string Token)>, Dictionary<int, ReadOnlyMemory<byte>>)> LoadTiktokenBpeAsync(
161
Dictionary<
StringSpanOrdinalKey
, (int Id, string Token)> vocab;
183
vocab = new Dictionary<
StringSpanOrdinalKey
, (int Id, string Token)>(suggestedCapacity);
1197
private static readonly ConcurrentDictionary<string, (Dictionary<ReadOnlyMemory<byte>, int> encoder, Dictionary<
StringSpanOrdinalKey
, (int Id, string Token)> vocab, Dictionary<int, ReadOnlyMemory<byte>> decoder)> _tiktokenCache = new(StringComparer.OrdinalIgnoreCase);
1221
out (Dictionary<ReadOnlyMemory<byte>, int> encoder, Dictionary<
StringSpanOrdinalKey
, (int Id, string Token)> vocab, Dictionary<int, ReadOnlyMemory<byte>> decoder) cache))
1312
(Dictionary<ReadOnlyMemory<byte>, int> encoder, Dictionary<
StringSpanOrdinalKey
, (int Id, string Token)> vocab, Dictionary<int, ReadOnlyMemory<byte>> decoder) =
Model\WordPieceTokenizer.cs (7)
29
private readonly Dictionary<
StringSpanOrdinalKey
, int> _vocab;
33
Dictionary<
StringSpanOrdinalKey
, int> vocab,
92
internal static async ValueTask<(Dictionary<
StringSpanOrdinalKey
, int>, Dictionary<int, string>)> LoadVocabAsync(Stream vocabStream, bool useAsync, CancellationToken cancellationToken = default)
99
Dictionary<
StringSpanOrdinalKey
, int> vocab = new Dictionary<
StringSpanOrdinalKey
, int>();
163
(Dictionary<
StringSpanOrdinalKey
, int> vocab, Dictionary<int, string> vocabReverse) = LoadVocabAsync(vocabStream, useAsync: false).GetAwaiter().GetResult();
227
(Dictionary<
StringSpanOrdinalKey
, int> vocab, Dictionary<int, string> vocabReverse) = await LoadVocabAsync(vocabStream, useAsync: true, cancellationToken);
Utils\LruCache.cs (1)
17
private readonly Dictionary<
StringSpanOrdinalKey
, LinkedListNode<KeyValuePair<string, TValue>>> _cache = new();
Utils\StringSpanOrdinalKey.cs (17)
19
internal readonly unsafe struct StringSpanOrdinalKey : IEquatable<
StringSpanOrdinalKey
>
41
obj is
StringSpanOrdinalKey
wrapper && Equals(wrapper);
43
public bool Equals(
StringSpanOrdinalKey
other) =>
51
private readonly
StringSpanOrdinalKey
_left;
52
private readonly
StringSpanOrdinalKey
_right;
77
private readonly Dictionary<
StringSpanOrdinalKey
, TValue> _map;
86
_map = new Dictionary<
StringSpanOrdinalKey
, TValue>(capacity);
129
internal sealed class Vocabulary : Dictionary<
StringSpanOrdinalKey
, (int, string)>;
132
/// Custom JSON converter for <see cref="
StringSpanOrdinalKey
"/>.
134
internal sealed class StringSpanOrdinalKeyConverter : JsonConverter<
StringSpanOrdinalKey
>
136
public override
StringSpanOrdinalKey
ReadAsPropertyName(ref Utf8JsonReader reader, Type typeToConvert, JsonSerializerOptions options) =>
139
public override void WriteAsPropertyName(Utf8JsonWriter writer,
StringSpanOrdinalKey
value, JsonSerializerOptions options) =>
142
public override
StringSpanOrdinalKey
Read(ref Utf8JsonReader reader, Type typeToConvert, JsonSerializerOptions options) => new StringSpanOrdinalKey(reader.GetString()!);
143
public override void Write(Utf8JsonWriter writer,
StringSpanOrdinalKey
value, JsonSerializerOptions options) => writer.WriteStringValue(value.Data!);
173
/// Extension methods for <see cref="
StringSpanOrdinalKey
"/>.
177
public static unsafe bool TryGetValue<TValue>(this Dictionary<
StringSpanOrdinalKey
, TValue> map, ReadOnlySpan<char> key, out TValue value)
185
public static bool TryGetValue<TValue>(this Dictionary<
StringSpanOrdinalKey
, TValue> map, string key, out TValue value) =>