PdfOcrExtractionNodeConfiguration
Namespace: Meshmakers.Octo.MeshAdapter.Nodes.Transform
Configuration for the PDF OCR extraction node, which uses IronOCR to extract text and data from PDF files.
public record PdfOcrExtractionNodeConfiguration : SourceTargetPathNodeConfiguration, INodeConfiguration, IEquatable<NodeConfiguration>, ITargetPathNodeConfiguration, IEquatable<TargetPathNodeConfiguration>, IPathNodeConfiguration, IEquatable<SourceTargetPathNodeConfiguration>, IEquatable<PdfOcrExtractionNodeConfiguration>
Inheritance Object → NodeConfiguration → TargetPathNodeConfiguration → SourceTargetPathNodeConfiguration → PdfOcrExtractionNodeConfiguration
Implements INodeConfiguration, IEquatable<NodeConfiguration>, ITargetPathNodeConfiguration, IEquatable<TargetPathNodeConfiguration>, IPathNodeConfiguration, IEquatable<SourceTargetPathNodeConfiguration>, IEquatable<PdfOcrExtractionNodeConfiguration>
Properties
PageNumbers
Specific page numbers to process (if not set, all pages will be processed)
public Int32[] PageNumbers { get; set; }
Property Value
Int32[]
Language
OCR language code (e.g., 'en', 'de', 'fr')
public string Language { get; set; }
Property Value
string
ExtractTables
Whether to extract tables from the PDF
public bool ExtractTables { get; set; }
Property Value
bool
TablesOutputPath
Output path for extracted tables
public string TablesOutputPath { get; set; }
Property Value
string
ExtractBarcodes
Whether to extract barcodes from the PDF
public bool ExtractBarcodes { get; set; }
Property Value
bool
BarcodesOutputPath
Output path for extracted barcodes
public string BarcodesOutputPath { get; set; }
Property Value
string
IncludeConfidence
Whether to include the OCR confidence score in the output
public bool IncludeConfidence { get; set; }
Property Value
bool
ConfidenceOutputPath
Output path for the OCR confidence score
public string ConfidenceOutputPath { get; set; }
Property Value
string
ContinueOnError
Whether to continue processing if OCR extraction fails
public bool ContinueOnError { get; set; }
Property Value
bool
Path
public string Path { get; set; }
Property Value
string
TargetPath
public string TargetPath { get; set; }
Property Value
string
TargetValueWriteMode
public TargetValueWriteModes TargetValueWriteMode { get; set; }
Property Value
TargetValueWriteModes
TargetValueKind
public ValueKinds TargetValueKind { get; set; }
Property Value
ValueKinds
DocumentMode
public DocumentModes DocumentMode { get; set; }
Property Value
DocumentModes
Description
public string Description { get; set; }
Property Value
string
Constructors
PdfOcrExtractionNodeConfiguration()
public PdfOcrExtractionNodeConfiguration()