API Reference
ReaderOptions
Options controlling extraction behavior for DocumentReader.
Inheritance
- Object
- ReaderOptions
Constructors
public ReaderOptions()
Inherited Methods
public override Boolean Equals(Object obj) #Returns: Boolean
Parameters
- obj Object
Properties
public Nullable<Int64> MaxInputBytes { get; set; } #Optional maximum input size in bytes enforced by DocumentReader when reading from a file or seekable stream. When null, no size limit is enforced.
public Nullable<Int64> OpenXmlMaxCharactersInPart { get; set; } #OpenXML security: maximum characters allowed per part when opening OpenXML packages (best-effort). When null, the OpenXML SDK default is used.
public Int32 MaxChars { get; set; } #Maximum characters per emitted chunk (best-effort).
public Int32 MaxTableRows { get; set; } #Maximum number of table rows included per table chunk (best-effort).
public Boolean IncludeWordFootnotes { get; set; } #When true, include Word footnotes as a final chunk. Default: true.
public Boolean IncludePowerPointNotes { get; set; } #When true, include PowerPoint speaker notes when present. Default: true.
public Boolean ExcelHeadersInFirstRow { get; set; } #Excel: when true, treat the first row as headers. Default: true.
public Int32 ExcelChunkRows { get; set; } #Excel: number of worksheet rows per emitted chunk. Default: 200.
public String ExcelSheetName { get; set; } #Excel: optional sheet name. When null, all sheets are extracted.
public String ExcelA1Range { get; set; } #Excel: optional A1 range. When null, the sheet's used range is used.
public Boolean MarkdownChunkByHeadings { get; set; } #Markdown: when true, chunk by headings where possible. Default: true.
public MarkdownInputNormalizationOptions MarkdownInputNormalization { get; set; } #Markdown: optional input normalization applied before parser-aware chunking. Intended for fixing up compact AI/chat-generated Markdown; when null, no normalization is applied and the default strict behavior is preserved.
public Boolean ComputeHashes { get; set; } #When true, computes source/chunk hashes for incremental indexing workflows. Default: true.