4 types derived from IngestionChunker
Microsoft.Extensions.DataIngestion (3)
Chunkers\HeaderChunker.cs (1)
17
public sealed class HeaderChunker :
IngestionChunker
<string>
Chunkers\SectionChunker.cs (1)
15
public sealed class SectionChunker :
IngestionChunker
<string>
Chunkers\SemanticSimilarityChunker.cs (1)
18
public sealed class SemanticSimilarityChunker :
IngestionChunker
<string>
Microsoft.Extensions.DataIngestion.Tests (1)
IngestionPipelineTests.cs (1)
176
internal class ImageChunker :
IngestionChunker
<DataContent>
18 references to IngestionChunker
Microsoft.Extensions.DataIngestion (2)
IngestionPipeline.cs (2)
28
private readonly
IngestionChunker
<T> _chunker;
43
IngestionChunker
<T> chunker,
Microsoft.Extensions.DataIngestion.Tests (16)
Chunkers\DocumentChunkerTests.cs (3)
14
protected abstract
IngestionChunker
<string> CreateDocumentChunker(int maxTokensPerChunk = 2_000, int overlapTokens = 500);
19
var
chunker = CreateDocumentChunker();
27
IngestionChunker
<string> chunker = CreateDocumentChunker();
Chunkers\SectionChunkerTests.cs (7)
14
protected override
IngestionChunker
<string> CreateDocumentChunker(int maxTokensPerChunk = 2_000, int overlapTokens = 500)
32
IngestionChunker
<string> chunker = CreateDocumentChunker();
65
IngestionChunker
<string> chunker = CreateDocumentChunker();
83
IngestionChunker
<string> chunker = CreateDocumentChunker();
126
IngestionChunker
<string> chunker = CreateDocumentChunker();
155
IngestionChunker
<string> chunker = CreateDocumentChunker(maxTokensPerChunk: 512);
176
IngestionChunker
<string> chunker = CreateDocumentChunker();
Chunkers\SemanticSimilarityChunkerTests.cs (5)
16
protected override
IngestionChunker
<string> CreateDocumentChunker(int maxTokensPerChunk = 2_000, int overlapTokens = 500)
24
private static
IngestionChunker
<string> CreateSemanticSimilarityChunker(TestEmbeddingGenerator embeddingClient, int maxTokensPerChunk = 2_000, int overlapTokens = 500)
56
IngestionChunker
<string> chunker = CreateSemanticSimilarityChunker(customGenerator);
99
IngestionChunker
<string> chunker = CreateSemanticSimilarityChunker(customGenerator);
175
IngestionChunker
<string> chunker = CreateSemanticSimilarityChunker(customGenerator, 200, 0);
IngestionPipelineTests.cs (1)
226
private static
IngestionChunker
<string> CreateChunker() => new HeaderChunker(new(TiktokenTokenizer.CreateForModel("gpt-4")));