5 types derived from IngestionChunker
Microsoft.Extensions.DataIngestion (4)
Chunkers\DocumentTokenChunker.cs (1)
23
public sealed class DocumentTokenChunker :
IngestionChunker
<string>
Chunkers\HeaderChunker.cs (1)
17
public sealed class HeaderChunker :
IngestionChunker
<string>
Chunkers\SectionChunker.cs (1)
15
public sealed class SectionChunker :
IngestionChunker
<string>
Chunkers\SemanticSimilarityChunker.cs (1)
18
public sealed class SemanticSimilarityChunker :
IngestionChunker
<string>
Microsoft.Extensions.DataIngestion.Tests (1)
IngestionPipelineTests.cs (1)
176
internal class ImageChunker :
IngestionChunker
<DataContent>
23 references to IngestionChunker
Microsoft.Extensions.DataIngestion (2)
IngestionPipeline.cs (2)
28
private readonly
IngestionChunker
<T> _chunker;
43
IngestionChunker
<T> chunker,
Microsoft.Extensions.DataIngestion.Tests (21)
Chunkers\DocumentChunkerTests.cs (3)
14
protected abstract
IngestionChunker
<string> CreateDocumentChunker(int maxTokensPerChunk = 2_000, int overlapTokens = 500);
19
var
chunker = CreateDocumentChunker();
27
IngestionChunker
<string> chunker = CreateDocumentChunker();
Chunkers\DocumentTokenChunkerTests.cs (1)
26
IngestionChunker
<string> chunker = CreateDocumentChunker();
Chunkers\NoOverlapTokenChunkerTests.cs (3)
14
protected override
IngestionChunker
<string> CreateDocumentChunker(int maxTokensPerChunk = 2_000, int overlapTokens = 500)
32
IngestionChunker
<string> chunker = CreateDocumentChunker(maxTokensPerChunk: 512);
53
IngestionChunker
<string> chunker = CreateDocumentChunker(maxTokensPerChunk: 200, overlapTokens: 0);
Chunkers\OverlapTokenChunkerTests.cs (1)
15
protected override
IngestionChunker
<string> CreateDocumentChunker(int maxTokensPerChunk = 2_000, int overlapTokens = 500)
Chunkers\SectionChunkerTests.cs (7)
14
protected override
IngestionChunker
<string> CreateDocumentChunker(int maxTokensPerChunk = 2_000, int overlapTokens = 500)
32
IngestionChunker
<string> chunker = CreateDocumentChunker();
65
IngestionChunker
<string> chunker = CreateDocumentChunker();
83
IngestionChunker
<string> chunker = CreateDocumentChunker();
126
IngestionChunker
<string> chunker = CreateDocumentChunker();
155
IngestionChunker
<string> chunker = CreateDocumentChunker(maxTokensPerChunk: 512);
176
IngestionChunker
<string> chunker = CreateDocumentChunker();
Chunkers\SemanticSimilarityChunkerTests.cs (5)
16
protected override
IngestionChunker
<string> CreateDocumentChunker(int maxTokensPerChunk = 2_000, int overlapTokens = 500)
24
private static
IngestionChunker
<string> CreateSemanticSimilarityChunker(TestEmbeddingGenerator embeddingClient, int maxTokensPerChunk = 2_000, int overlapTokens = 500)
56
IngestionChunker
<string> chunker = CreateSemanticSimilarityChunker(customGenerator);
99
IngestionChunker
<string> chunker = CreateSemanticSimilarityChunker(customGenerator);
175
IngestionChunker
<string> chunker = CreateSemanticSimilarityChunker(customGenerator, 200, 0);
IngestionPipelineTests.cs (1)
226
private static
IngestionChunker
<string> CreateChunker() => new HeaderChunker(new(TiktokenTokenizer.CreateForModel("gpt-4")));