From 647540b5e07a523a768ae0cdd5c9818dda0d5364 Mon Sep 17 00:00:00 2001 From: venkateshwaransf5013 Date: Thu, 5 Mar 2026 20:31:25 +0530 Subject: [PATCH 01/13] Added the UG content for SmartDataExtractor --- Document-Processing-toc.html | 31 +++++++++++++++++++++++++++++++ 1 file changed, 31 insertions(+) diff --git a/Document-Processing-toc.html b/Document-Processing-toc.html index 166c62ed1..8da05da40 100644 --- a/Document-Processing-toc.html +++ b/Document-Processing-toc.html @@ -113,6 +113,37 @@
  • NuGet Packages
  • +
  • SmartDataExtractor + +
  • PDF
  • + diff --git a/Document-Processing/SmartDataExtractor/NET/TableExtractor/Features.md b/Document-Processing/SmartDataExtractor/NET/TableExtractor/Features.md index 72edaa2f7..e25dc6f4a 100644 --- a/Document-Processing/SmartDataExtractor/NET/TableExtractor/Features.md +++ b/Document-Processing/SmartDataExtractor/NET/TableExtractor/Features.md @@ -43,7 +43,7 @@ using (FileStream stream = new FileStream("Input.pdf", FileMode.Open, FileAccess {% endtabs %} -## Extract Tables with detect borderless tables +## Extract Tables with detect border less tables To extract structured table data from a PDF document that contains tables without visible borders using the **ExtractTableAsJson** method of the **TableExtractor** class, refer to the following code examples. @@ -135,6 +135,8 @@ using (FileStream stream = new FileStream("Input.pdf", FileMode.Open, FileAccess File.WriteAllText("Output.json", data, Encoding.UTF8); } +{% endhighlight %} + {% endtabs %} ## Extract table data asynchronously from a PDF document From ded4087cd495d5976dbed1679a49852001b9ff02 Mon Sep 17 00:00:00 2001 From: venkateshwaransf5013 Date: Mon, 9 Mar 2026 12:32:44 +0530 Subject: [PATCH 07/13] Resolved the CI issues --- Document-Processing-toc.html | 26 +++++++++---------- .../Assemblies-Required.md | 0 ...ile-missing-error-in-smart-data-extractor} | 6 +---- .../NET/SmartDataExtractor}/Features.md | 0 .../NuGet-Packages-Required.md | 0 .../NET/SmartDataExtractor/faq.md | 13 ++++++++++ .../NET/SmartDataExtractor}/overview.md | 0 .../Assemblies-Required.md | 0 ...le-missing-error-in-smart-table-extractor} | 6 +---- .../NET/SmartTableExtractor}/Features.md | 0 .../NuGet-Packages-Required.md | 0 .../NET/SmartTableExtractor/faq.md | 13 ++++++++++ .../NET/SmartTableExtractor}/overview.md | 0 .../NET/overview.md | 0 .../NET/assemblies-required.md | 0 .../NET/nuGet-packages-required.md | 0 .../SmartFormRecognizer/NET/overview.md | 0 .../NET/recognize-forms.md | 0 .../NET/smart-form-recognizer.md | 0 
.../NET/working-with-recognize-option.md | 0 20 files changed, 41 insertions(+), 23 deletions(-) rename Document-Processing/{SmartDataExtractor/NET/DataExtractor => DataExtraction/NET/SmartDataExtractor}/Assemblies-Required.md (100%) rename Document-Processing/{SmartDataExtractor/NET/DataExtractor/FAQ/how to resolve the ONNX file missing error in Smart Data Extractor.md => DataExtraction/NET/SmartDataExtractor/FAQ/how-to-resolve-the-onnx-file-missing-error-in-smart-data-extractor} (86%) rename Document-Processing/{SmartDataExtractor/NET/DataExtractor => DataExtraction/NET/SmartDataExtractor}/Features.md (100%) rename Document-Processing/{SmartDataExtractor/NET/DataExtractor => DataExtraction/NET/SmartDataExtractor}/NuGet-Packages-Required.md (100%) create mode 100644 Document-Processing/DataExtraction/NET/SmartDataExtractor/faq.md rename Document-Processing/{SmartDataExtractor/NET/DataExtractor => DataExtraction/NET/SmartDataExtractor}/overview.md (100%) rename Document-Processing/{SmartDataExtractor/NET/TableExtractor => DataExtraction/NET/SmartTableExtractor}/Assemblies-Required.md (100%) rename Document-Processing/{SmartDataExtractor/NET/TableExtractor/FAQ/how to resolve the ONNX file missing error in Smart Table Extractor.md => DataExtraction/NET/SmartTableExtractor/FAQ/how-to-resolve-the-onnx-file-missing-error-in-smart-table-extractor} (86%) rename Document-Processing/{SmartDataExtractor/NET/TableExtractor => DataExtraction/NET/SmartTableExtractor}/Features.md (100%) rename Document-Processing/{SmartDataExtractor/NET/TableExtractor => DataExtraction/NET/SmartTableExtractor}/NuGet-Packages-Required.md (100%) create mode 100644 Document-Processing/DataExtraction/NET/SmartTableExtractor/faq.md rename Document-Processing/{SmartDataExtractor/NET/TableExtractor => DataExtraction/NET/SmartTableExtractor}/overview.md (100%) rename Document-Processing/{SmartDataExtractor => DataExtraction}/NET/overview.md (100%) rename Document-Processing/{SmartDataExtractor => 
DataExtraction}/SmartFormRecognizer/NET/assemblies-required.md (100%) rename Document-Processing/{SmartDataExtractor => DataExtraction}/SmartFormRecognizer/NET/nuGet-packages-required.md (100%) rename Document-Processing/{SmartDataExtractor => DataExtraction}/SmartFormRecognizer/NET/overview.md (100%) rename Document-Processing/{SmartDataExtractor => DataExtraction}/SmartFormRecognizer/NET/recognize-forms.md (100%) rename Document-Processing/{SmartDataExtractor => DataExtraction}/SmartFormRecognizer/NET/smart-form-recognizer.md (100%) rename Document-Processing/{SmartDataExtractor => DataExtraction}/SmartFormRecognizer/NET/working-with-recognize-option.md (100%) diff --git a/Document-Processing-toc.html b/Document-Processing-toc.html index 50a387f0b..e20297275 100644 --- a/Document-Processing-toc.html +++ b/Document-Processing-toc.html @@ -116,25 +116,25 @@
  • SmartDataExtractor
    • - NET + NET
      • - DataExtractor + DataExtractor
        • - TableExtractor + TableExtractor
          • - Assemblies Required + Assemblies Required
          • - NuGet Packages Required + NuGet Packages Required
          • - Features + Features
          • - FAQ + FAQ
          • diff --git a/Document-Processing/SmartDataExtractor/NET/DataExtractor/Assemblies-Required.md b/Document-Processing/DataExtraction/NET/SmartDataExtractor/Assemblies-Required.md similarity index 100% rename from Document-Processing/SmartDataExtractor/NET/DataExtractor/Assemblies-Required.md rename to Document-Processing/DataExtraction/NET/SmartDataExtractor/Assemblies-Required.md diff --git a/Document-Processing/SmartDataExtractor/NET/DataExtractor/FAQ/how to resolve the ONNX file missing error in Smart Data Extractor.md b/Document-Processing/DataExtraction/NET/SmartDataExtractor/FAQ/how-to-resolve-the-onnx-file-missing-error-in-smart-data-extractor similarity index 86% rename from Document-Processing/SmartDataExtractor/NET/DataExtractor/FAQ/how to resolve the ONNX file missing error in Smart Data Extractor.md rename to Document-Processing/DataExtraction/NET/SmartDataExtractor/FAQ/how-to-resolve-the-onnx-file-missing-error-in-smart-data-extractor index 18e783b17..1bebd8bd8 100644 --- a/Document-Processing/SmartDataExtractor/NET/DataExtractor/FAQ/how to resolve the ONNX file missing error in Smart Data Extractor.md +++ b/Document-Processing/DataExtraction/NET/SmartDataExtractor/FAQ/how-to-resolve-the-onnx-file-missing-error-in-smart-data-extractor @@ -24,14 +24,10 @@ Solution: 1. Run a build so the application output is generated under `bin\Debug\netX.X\runtimes` (or your configured build configuration and target framework). 2. Locate the project's build output `bin` path (for example: `bin\Debug\net6.0\runtimes`). -3. Place all required ONNX model files into a `runtimes\models` folder inside that bin path (for example: `bin\Debug\net6.0\runtimes\models\syncfusion_doclayout.onnx`). +3. Place all required ONNX model files into a `runtimes\models` folder inside that bin path. 4. In Visual Studio, for each ONNX file set **Properties → Copy to Output Directory → Copy always** so the model is included on every build. 5. Rebuild and run your project. 
The extractor should now find the ONNX models and operate correctly. -Screenshot placeholder - -Add a screenshot showing the exception or the `runtimes\models` folder layout. Save the image in the repo (suggested path relative to this file): `../images/onnx-missing.png` and include it here: - Notes: - If you publish your application, ensure the `runtimes\models` folder and ONNX files are included in the publish output (you may need to mark files as content in the project file or use a entry). diff --git a/Document-Processing/SmartDataExtractor/NET/DataExtractor/Features.md b/Document-Processing/DataExtraction/NET/SmartDataExtractor/Features.md similarity index 100% rename from Document-Processing/SmartDataExtractor/NET/DataExtractor/Features.md rename to Document-Processing/DataExtraction/NET/SmartDataExtractor/Features.md diff --git a/Document-Processing/SmartDataExtractor/NET/DataExtractor/NuGet-Packages-Required.md b/Document-Processing/DataExtraction/NET/SmartDataExtractor/NuGet-Packages-Required.md similarity index 100% rename from Document-Processing/SmartDataExtractor/NET/DataExtractor/NuGet-Packages-Required.md rename to Document-Processing/DataExtraction/NET/SmartDataExtractor/NuGet-Packages-Required.md diff --git a/Document-Processing/DataExtraction/NET/SmartDataExtractor/faq.md b/Document-Processing/DataExtraction/NET/SmartDataExtractor/faq.md new file mode 100644 index 000000000..ad16258f9 --- /dev/null +++ b/Document-Processing/DataExtraction/NET/SmartDataExtractor/faq.md @@ -0,0 +1,13 @@ +--- +title: Extract structured data from PDF and image documents in .NET | Syncfusion +description: Syncfusion® Smart Data Extractor is a .NET library that extracts tables, form fields, text blocks, and images from PDF and image documents, producing PDFs and structured JSON for verification, automation and processing. 
+platform: document-processing +control: SmartDataExtractor +documentation: UG +--- + +# Frequently Asked Questions in Blazor SfPdfViewer Component + +Common questions and answers for using the Syncfusion Blazor SfPdfViewer component. + +* [How to Resolve the ONNX File Missing Error in Smart Data Extractor?](./FAQ/how-to-resolve-the-onnx-file-missing-error-in-smart-data-extractor) diff --git a/Document-Processing/SmartDataExtractor/NET/DataExtractor/overview.md b/Document-Processing/DataExtraction/NET/SmartDataExtractor/overview.md similarity index 100% rename from Document-Processing/SmartDataExtractor/NET/DataExtractor/overview.md rename to Document-Processing/DataExtraction/NET/SmartDataExtractor/overview.md diff --git a/Document-Processing/SmartDataExtractor/NET/TableExtractor/Assemblies-Required.md b/Document-Processing/DataExtraction/NET/SmartTableExtractor/Assemblies-Required.md similarity index 100% rename from Document-Processing/SmartDataExtractor/NET/TableExtractor/Assemblies-Required.md rename to Document-Processing/DataExtraction/NET/SmartTableExtractor/Assemblies-Required.md diff --git a/Document-Processing/SmartDataExtractor/NET/TableExtractor/FAQ/how to resolve the ONNX file missing error in Smart Table Extractor.md b/Document-Processing/DataExtraction/NET/SmartTableExtractor/FAQ/how-to-resolve-the-onnx-file-missing-error-in-smart-table-extractor similarity index 86% rename from Document-Processing/SmartDataExtractor/NET/TableExtractor/FAQ/how to resolve the ONNX file missing error in Smart Table Extractor.md rename to Document-Processing/DataExtraction/NET/SmartTableExtractor/FAQ/how-to-resolve-the-onnx-file-missing-error-in-smart-table-extractor index 9f2a4da83..a5976520f 100644 --- a/Document-Processing/SmartDataExtractor/NET/TableExtractor/FAQ/how to resolve the ONNX file missing error in Smart Table Extractor.md +++ 
b/Document-Processing/DataExtraction/NET/SmartTableExtractor/FAQ/how-to-resolve-the-onnx-file-missing-error-in-smart-table-extractor @@ -24,14 +24,10 @@ Solution: 1. Run a build so the application output is generated under `bin\Debug\netX.X\runtimes` (or your configured build configuration and target framework). 2. Locate the project's build output `bin` path (for example: `bin\Debug\net6.0\runtimes`). -3. Place all required ONNX model files into a `runtimes\models` folder inside that bin path (for example: `bin\Debug\net6.0\runtimes\models\syncfusion_doclayout.onnx`). +3. Place all required ONNX model files into a `runtimes\models` folder inside that bin path. 4. In Visual Studio, for each ONNX file set **Properties → Copy to Output Directory → Copy always** so the model is included on every build. 5. Rebuild and run your project. The extractor should now find the ONNX models and operate correctly. -Screenshot placeholder - -Add a screenshot showing the exception or the `runtimes\models` folder layout. Save the image in the repo (suggested path relative to this file): `../images/onnx-missing.png` and include it here: - Notes: - If you publish your application, ensure the `runtimes\models` folder and ONNX files are included in the publish output (you may need to mark files as content in the project file or use a entry). 
diff --git a/Document-Processing/SmartDataExtractor/NET/TableExtractor/Features.md b/Document-Processing/DataExtraction/NET/SmartTableExtractor/Features.md similarity index 100% rename from Document-Processing/SmartDataExtractor/NET/TableExtractor/Features.md rename to Document-Processing/DataExtraction/NET/SmartTableExtractor/Features.md diff --git a/Document-Processing/SmartDataExtractor/NET/TableExtractor/NuGet-Packages-Required.md b/Document-Processing/DataExtraction/NET/SmartTableExtractor/NuGet-Packages-Required.md similarity index 100% rename from Document-Processing/SmartDataExtractor/NET/TableExtractor/NuGet-Packages-Required.md rename to Document-Processing/DataExtraction/NET/SmartTableExtractor/NuGet-Packages-Required.md diff --git a/Document-Processing/DataExtraction/NET/SmartTableExtractor/faq.md b/Document-Processing/DataExtraction/NET/SmartTableExtractor/faq.md new file mode 100644 index 000000000..43cc23835 --- /dev/null +++ b/Document-Processing/DataExtraction/NET/SmartTableExtractor/faq.md @@ -0,0 +1,13 @@ +--- +title: Extract structured data from PDF and image documents in .NET | Syncfusion +description: Syncfusion® Smart Data Extractor is a .NET library that extracts tables, form fields, text blocks, and images from PDF and image documents, producing PDFs and structured JSON for verification, automation and processing. +platform: document-processing +control: SmartDataExtractor +documentation: UG +--- + +# Frequently Asked Questions in Blazor SfPdfViewer Component + +Common questions and answers for using the Syncfusion Data Extraction Library. 
+ +* [How to Resolve the ONNX File Missing Error in Smart Table Extractor?](./FAQ/how-to-resolve-the-onnx-file-missing-error-in-smart-table-extractor) diff --git a/Document-Processing/SmartDataExtractor/NET/TableExtractor/overview.md b/Document-Processing/DataExtraction/NET/SmartTableExtractor/overview.md similarity index 100% rename from Document-Processing/SmartDataExtractor/NET/TableExtractor/overview.md rename to Document-Processing/DataExtraction/NET/SmartTableExtractor/overview.md diff --git a/Document-Processing/SmartDataExtractor/NET/overview.md b/Document-Processing/DataExtraction/NET/overview.md similarity index 100% rename from Document-Processing/SmartDataExtractor/NET/overview.md rename to Document-Processing/DataExtraction/NET/overview.md diff --git a/Document-Processing/SmartDataExtractor/SmartFormRecognizer/NET/assemblies-required.md b/Document-Processing/DataExtraction/SmartFormRecognizer/NET/assemblies-required.md similarity index 100% rename from Document-Processing/SmartDataExtractor/SmartFormRecognizer/NET/assemblies-required.md rename to Document-Processing/DataExtraction/SmartFormRecognizer/NET/assemblies-required.md diff --git a/Document-Processing/SmartDataExtractor/SmartFormRecognizer/NET/nuGet-packages-required.md b/Document-Processing/DataExtraction/SmartFormRecognizer/NET/nuGet-packages-required.md similarity index 100% rename from Document-Processing/SmartDataExtractor/SmartFormRecognizer/NET/nuGet-packages-required.md rename to Document-Processing/DataExtraction/SmartFormRecognizer/NET/nuGet-packages-required.md diff --git a/Document-Processing/SmartDataExtractor/SmartFormRecognizer/NET/overview.md b/Document-Processing/DataExtraction/SmartFormRecognizer/NET/overview.md similarity index 100% rename from Document-Processing/SmartDataExtractor/SmartFormRecognizer/NET/overview.md rename to Document-Processing/DataExtraction/SmartFormRecognizer/NET/overview.md diff --git 
a/Document-Processing/SmartDataExtractor/SmartFormRecognizer/NET/recognize-forms.md b/Document-Processing/DataExtraction/SmartFormRecognizer/NET/recognize-forms.md similarity index 100% rename from Document-Processing/SmartDataExtractor/SmartFormRecognizer/NET/recognize-forms.md rename to Document-Processing/DataExtraction/SmartFormRecognizer/NET/recognize-forms.md diff --git a/Document-Processing/SmartDataExtractor/SmartFormRecognizer/NET/smart-form-recognizer.md b/Document-Processing/DataExtraction/SmartFormRecognizer/NET/smart-form-recognizer.md similarity index 100% rename from Document-Processing/SmartDataExtractor/SmartFormRecognizer/NET/smart-form-recognizer.md rename to Document-Processing/DataExtraction/SmartFormRecognizer/NET/smart-form-recognizer.md diff --git a/Document-Processing/SmartDataExtractor/SmartFormRecognizer/NET/working-with-recognize-option.md b/Document-Processing/DataExtraction/SmartFormRecognizer/NET/working-with-recognize-option.md similarity index 100% rename from Document-Processing/SmartDataExtractor/SmartFormRecognizer/NET/working-with-recognize-option.md rename to Document-Processing/DataExtraction/SmartFormRecognizer/NET/working-with-recognize-option.md From ba382a6277b9b797747ede8f1cbe315fb207af24 Mon Sep 17 00:00:00 2001 From: venkateshwaransf5013 Date: Mon, 9 Mar 2026 12:38:42 +0530 Subject: [PATCH 08/13] added changes --- Document-Processing-toc.html | 16 ++++++++-------- 1 file changed, 8 insertions(+), 8 deletions(-) diff --git a/Document-Processing-toc.html b/Document-Processing-toc.html index e20297275..9ea1e0f39 100644 --- a/Document-Processing-toc.html +++ b/Document-Processing-toc.html @@ -113,7 +113,7 @@
          • NuGet Packages
          • -
          • SmartDataExtractor +
          • DataExtraction
            • NET @@ -3199,26 +3199,26 @@
          • -
          • SmartDataExtractor +
          • DataExtraction
            • - SmartFormRecognizer + SmartFormRecognizer
            • NET
            • From 2e3bf50cc60619a421424856eb401586388353f7 Mon Sep 17 00:00:00 2001 From: venkateshwaransf5013 Date: Mon, 9 Mar 2026 13:15:41 +0530 Subject: [PATCH 09/13] Resolved the CI issues --- Document-Processing-toc.html | 6 ++++-- .../SmartDataExtractor/Assemblies-Required.md | 4 ++-- ...file-missing-error-in-smart-data-extractor | 7 ++++--- .../NET/SmartDataExtractor/Features.md | 5 +++-- .../NuGet-Packages-Required.md | 15 ++++++++------- .../NET/SmartDataExtractor/faq.md | 9 +++++---- .../NET/SmartDataExtractor/overview.md | 5 +++-- .../Assemblies-Required.md | 4 ++-- .../NET/SmartTableExtractor/Features.md | 5 +++-- .../NuGet-Packages-Required.md | 15 ++++++++------- .../NET/SmartTableExtractor/faq.md | 11 ++++++----- .../NET/SmartTableExtractor/overview.md | 5 +++-- .../DataExtraction/NET/overview.md | 19 +++++++++++++++---- 13 files changed, 66 insertions(+), 44 deletions(-) diff --git a/Document-Processing-toc.html b/Document-Processing-toc.html index 9ea1e0f39..4e633af2f 100644 --- a/Document-Processing-toc.html +++ b/Document-Processing-toc.html @@ -113,7 +113,8 @@
            • NuGet Packages
            • -
            • DataExtraction +
            • + DataExtraction
              • NET @@ -3199,7 +3200,8 @@
            • -
            • DataExtraction +
            • + DataExtraction
              • SmartFormRecognizer diff --git a/Document-Processing/DataExtraction/NET/SmartDataExtractor/Assemblies-Required.md b/Document-Processing/DataExtraction/NET/SmartDataExtractor/Assemblies-Required.md index a1303194a..1a4bd8c5f 100644 --- a/Document-Processing/DataExtraction/NET/SmartDataExtractor/Assemblies-Required.md +++ b/Document-Processing/DataExtraction/NET/SmartDataExtractor/Assemblies-Required.md @@ -1,6 +1,6 @@ --- -title: Extract structured data from PDF and image documents in .NET | Syncfusion -description: Syncfusion® Smart Data Extractor is a .NET library that extracts tables, form fields, text blocks, and images from PDF and image documents, producing PDFs and structured JSON for verification, automation and processing. +title: Extract structured data from PDF & image Files in .NET | Syncfusion +description: Syncfusion® Smart Data Extractor is a .NET library that extracts tables, forms, text, and images from documents, producing PDFs and JSON. platform: document-processing control: SmartDataExtractor documentation: UG diff --git a/Document-Processing/DataExtraction/NET/SmartDataExtractor/FAQ/how-to-resolve-the-onnx-file-missing-error-in-smart-data-extractor b/Document-Processing/DataExtraction/NET/SmartDataExtractor/FAQ/how-to-resolve-the-onnx-file-missing-error-in-smart-data-extractor index 1bebd8bd8..c7ad96616 100644 --- a/Document-Processing/DataExtraction/NET/SmartDataExtractor/FAQ/how-to-resolve-the-onnx-file-missing-error-in-smart-data-extractor +++ b/Document-Processing/DataExtraction/NET/SmartDataExtractor/FAQ/how-to-resolve-the-onnx-file-missing-error-in-smart-data-extractor @@ -1,9 +1,10 @@ --- -title: Extract structured data from PDF and image documents in .NET | Syncfusion -description: Syncfusion® Smart Data Extractor is a .NET library that extracts tables, form fields, text blocks, and images from PDF and image documents, producing PDFs and structured JSON for verification, automation and processing. 
-platform: documentProcessing +title: Extract structured data from PDF & image Files in .NET | Syncfusion +description: Syncfusion® Smart Data Extractor is a .NET library that extracts tables, forms, text, and images from documents, producing PDFs and JSON. +platform: document-processing control: SmartDataExtractor documentation: UG +keywords: Assemblies --- # How to resolve the “ONNX file missing” error in Smart Data Extractor diff --git a/Document-Processing/DataExtraction/NET/SmartDataExtractor/Features.md b/Document-Processing/DataExtraction/NET/SmartDataExtractor/Features.md index 4a6459702..f6e646354 100644 --- a/Document-Processing/DataExtraction/NET/SmartDataExtractor/Features.md +++ b/Document-Processing/DataExtraction/NET/SmartDataExtractor/Features.md @@ -1,9 +1,10 @@ --- -title: Extract structured data from PDF and image documents in .NET | Syncfusion -description: Syncfusion® Smart Data Extractor is a .NET library that extracts tables, form fields, text blocks, and images from PDF and image documents, producing PDFs and structured JSON for verification, automation and processing. +title: Extract structured data from PDF & image Files in .NET | Syncfusion +description: Syncfusion® Smart Data Extractor is a .NET library that extracts tables, forms, text, and images from documents, producing PDFs and JSON. 
platform: document-processing control: SmartDataExtractor documentation: UG +keywords: Assemblies --- # SmartDataExtractor Features diff --git a/Document-Processing/DataExtraction/NET/SmartDataExtractor/NuGet-Packages-Required.md b/Document-Processing/DataExtraction/NET/SmartDataExtractor/NuGet-Packages-Required.md index 8eaf451f8..84fe35abc 100644 --- a/Document-Processing/DataExtraction/NET/SmartDataExtractor/NuGet-Packages-Required.md +++ b/Document-Processing/DataExtraction/NET/SmartDataExtractor/NuGet-Packages-Required.md @@ -1,9 +1,10 @@ --- -title: Extract structured data from PDF and image documents in .NET | Syncfusion -description: Syncfusion® Smart Data Extractor is a .NET library that extracts tables, form fields, text blocks, and images from PDF and image documents, producing PDFs and structured JSON for verification, automation and processing. +title: Extract structured data from PDF & image Files in .NET | Syncfusion +description: Syncfusion® Smart Data Extractor is a .NET library that extracts tables, forms, text, and images from documents, producing PDFs and JSON. platform: document-processing control: SmartDataExtractor documentation: UG +keywords: Assemblies --- # NuGet Packages Required for SmartDataExtractor @@ -24,7 +25,7 @@ Windows Forms
                Console Application (Targeting .NET Framework) -{{'[Syncfusion.SmartDataExtractor.WinForms.nupkg](https://www.nuget.org/packages/Syncfusion.SmartDataExtractor.WinForms/)'| markdownify }} +{{'[Syncfusion.SmartDataExtractor.WinForms.nupkg]'| markdownify }} @@ -32,7 +33,7 @@ Console Application (Targeting .NET Framework) WPF -{{'[Syncfusion.SmartDataExtractor.Wpf.nupkg](https://www.nuget.org/packages/Syncfusion.SmartDataExtractor.Wpf/)'| markdownify }} +{{'[Syncfusion.SmartDataExtractor.Wpf.nupkg]'| markdownify }} @@ -40,7 +41,7 @@ WPF ASP.NET MVC5 -{{'[Syncfusion.SmartDataExtractor.AspNet.Mvc5.nupkg](https://www.nuget.org/packages/Syncfusion.SmartDataExtractor.AspNet.Mvc5/)'| markdownify }} +{{'[Syncfusion.SmartDataExtractor.AspNet.Mvc5.nupkg]'| markdownify }} @@ -50,7 +51,7 @@ Console Application (Targeting .NET Core)
                Blazor -{{'[Syncfusion.SmartDataExtractor.Net.Core.nupkg](https://www.nuget.org/packages/Syncfusion.SmartDataExtractor.Net.Core/)'| markdownify }} +{{'[Syncfusion.SmartDataExtractor.Net.Core.nupkg]'| markdownify }} @@ -59,7 +60,7 @@ Windows UI (WinUI)
                .NET Multi-platform App UI (.NET MAUI) -{{'[Syncfusion.SmartDataExtractor.NET.nupkg](https://www.nuget.org/packages/Syncfusion.SmartDataExtractor.NET/)'| markdownify }} +{{'[Syncfusion.SmartDataExtractor.NET.nupkg]'| markdownify }} diff --git a/Document-Processing/DataExtraction/NET/SmartDataExtractor/faq.md b/Document-Processing/DataExtraction/NET/SmartDataExtractor/faq.md index ad16258f9..edc04f8b7 100644 --- a/Document-Processing/DataExtraction/NET/SmartDataExtractor/faq.md +++ b/Document-Processing/DataExtraction/NET/SmartDataExtractor/faq.md @@ -1,13 +1,14 @@ --- -title: Extract structured data from PDF and image documents in .NET | Syncfusion -description: Syncfusion® Smart Data Extractor is a .NET library that extracts tables, form fields, text blocks, and images from PDF and image documents, producing PDFs and structured JSON for verification, automation and processing. +title: Extract structured data from PDF & image Files in .NET | Syncfusion +description: Syncfusion® Smart Data Extractor is a .NET library that extracts tables, forms, text, and images from documents, producing PDFs and JSON. platform: document-processing control: SmartDataExtractor documentation: UG +keywords: Assemblies --- -# Frequently Asked Questions in Blazor SfPdfViewer Component +# Frequently Asked Questions in Data Extractor Library -Common questions and answers for using the Syncfusion Blazor SfPdfViewer component. +Common questions and answers for using the Syncfusion Data Extractor. 
* [How to Resolve the ONNX File Missing Error in Smart Data Extractor?](./FAQ/how-to-resolve-the-onnx-file-missing-error-in-smart-data-extractor) diff --git a/Document-Processing/DataExtraction/NET/SmartDataExtractor/overview.md b/Document-Processing/DataExtraction/NET/SmartDataExtractor/overview.md index 74b052334..6eaba6276 100644 --- a/Document-Processing/DataExtraction/NET/SmartDataExtractor/overview.md +++ b/Document-Processing/DataExtraction/NET/SmartDataExtractor/overview.md @@ -1,9 +1,10 @@ --- -title: Extract structured data from PDF and image documents in .NET | Syncfusion -description: Syncfusion® Smart Data Extractor is a .NET library that extracts tables, form fields, text blocks, and images from PDF and image documents, producing PDFs and structured JSON for verification, automation and processing. +title: Extract structured data from PDF & image Files in .NET | Syncfusion +description: Syncfusion® Smart Data Extractor is a .NET library that extracts tables, forms, text, and images from documents, producing PDFs and JSON. platform: document-processing control: SmartDataExtractor documentation: UG +keywords: Assemblies --- # Overview of SmartDataExtractor diff --git a/Document-Processing/DataExtraction/NET/SmartTableExtractor/Assemblies-Required.md b/Document-Processing/DataExtraction/NET/SmartTableExtractor/Assemblies-Required.md index 15bcda765..1d6964ab3 100644 --- a/Document-Processing/DataExtraction/NET/SmartTableExtractor/Assemblies-Required.md +++ b/Document-Processing/DataExtraction/NET/SmartTableExtractor/Assemblies-Required.md @@ -1,7 +1,7 @@ --- title: Extract tables from PDF and image documents in .NET | Syncfusion -description: Syncfusion® Smart Table Extractor is a .NET library that extracts tabular data from PDF documents. It detects table regions, header rows, columns, cell spans (merged cells), and provides structured JSON. 
-platform: SmartTableExtractor +description: Syncfusion® Smart Table Extractor detects tables in PDFs, including headers, columns, and merged cells, outputting JSON. +platform: document-processing control: PDF documentation: UG keywords: Assemblies diff --git a/Document-Processing/DataExtraction/NET/SmartTableExtractor/Features.md b/Document-Processing/DataExtraction/NET/SmartTableExtractor/Features.md index e25dc6f4a..be273fbfa 100644 --- a/Document-Processing/DataExtraction/NET/SmartTableExtractor/Features.md +++ b/Document-Processing/DataExtraction/NET/SmartTableExtractor/Features.md @@ -1,9 +1,10 @@ --- title: Extract tables from PDF and image documents in .NET | Syncfusion -description: Syncfusion® Smart Table Extractor is a .NET library that extracts tabular data from PDF documents. It detects table regions, header rows, columns, cell spans (merged cells), and provides structured JSON. -platform: SmartTableExtractor +description: Syncfusion® Smart Table Extractor detects tables in PDFs, including headers, columns, and merged cells, outputting JSON. +platform: document-processing control: PDF documentation: UG +keywords: Assemblies --- # SmartTableExtractor Features diff --git a/Document-Processing/DataExtraction/NET/SmartTableExtractor/NuGet-Packages-Required.md b/Document-Processing/DataExtraction/NET/SmartTableExtractor/NuGet-Packages-Required.md index 561370093..e59ea9370 100644 --- a/Document-Processing/DataExtraction/NET/SmartTableExtractor/NuGet-Packages-Required.md +++ b/Document-Processing/DataExtraction/NET/SmartTableExtractor/NuGet-Packages-Required.md @@ -1,9 +1,10 @@ --- title: Extract tables from PDF and image documents in .NET | Syncfusion -description: Syncfusion® Smart Table Extractor is a .NET library that extracts tabular data from PDF documents. It detects table regions, header rows, columns, cell spans (merged cells), and provides structured JSON. 
-platform: SmartTableExtractor +description: Syncfusion® Smart Table Extractor detects tables in PDFs, including headers, columns, and merged cells, outputting JSON. +platform: document-processing control: PDF documentation: UG +keywords: Assemblies --- # NuGet Packages Required for SmartTableExtractor @@ -24,7 +25,7 @@ Windows Forms
                Console Application (Targeting .NET Framework) -{{'[Syncfusion.SmartTableExtractor.WinForms.nupkg](https://www.nuget.org/packages/Syncfusion.SmartTableExtractor.WinForms/)'| markdownify }} +{{'[Syncfusion.SmartTableExtractor.WinForms.nupkg]'| markdownify }} @@ -32,7 +33,7 @@ Console Application (Targeting .NET Framework) WPF -{{'[Syncfusion.SmartTableExtractor.Wpf.nupkg](https://www.nuget.org/packages/Syncfusion.SmartTableExtractor.Wpf/)'| markdownify }} +{{'[Syncfusion.SmartTableExtractor.Wpf.nupkg]'| markdownify }} @@ -40,7 +41,7 @@ WPF ASP.NET MVC5 -{{'[Syncfusion.SmartTableExtractor.AspNet.Mvc5.nupkg](https://www.nuget.org/packages/Syncfusion.SmartTableExtractor.AspNet.Mvc5/)'| markdownify }} +{{'[Syncfusion.SmartTableExtractor.AspNet.Mvc5.nupkg]'| markdownify }} @@ -50,7 +51,7 @@ Console Application (Targeting .NET Core)
                Blazor -{{'[Syncfusion.SmartTableExtractor.Net.Core.nupkg](https://www.nuget.org/packages/Syncfusion.SmartTableExtractor.Net.Core/)'| markdownify }} +{{'[Syncfusion.SmartTableExtractor.Net.Core.nupkg]'| markdownify }} @@ -59,7 +60,7 @@ Windows UI (WinUI)
                .NET Multi-platform App UI (.NET MAUI) -{{'[Syncfusion.SmartTableExtractor.NET.nupkg](https://www.nuget.org/packages/Syncfusion.SmartTableExtractor.NET/)'| markdownify }} +{{'[Syncfusion.SmartTableExtractor.NET.nupkg]'| markdownify }} diff --git a/Document-Processing/DataExtraction/NET/SmartTableExtractor/faq.md b/Document-Processing/DataExtraction/NET/SmartTableExtractor/faq.md index 43cc23835..fd60f2534 100644 --- a/Document-Processing/DataExtraction/NET/SmartTableExtractor/faq.md +++ b/Document-Processing/DataExtraction/NET/SmartTableExtractor/faq.md @@ -1,13 +1,14 @@ --- -title: Extract structured data from PDF and image documents in .NET | Syncfusion -description: Syncfusion® Smart Data Extractor is a .NET library that extracts tables, form fields, text blocks, and images from PDF and image documents, producing PDFs and structured JSON for verification, automation and processing. +title: Extract tables from PDF and image documents in .NET | Syncfusion +description: Syncfusion® Smart Table Extractor detects tables in PDFs, including headers, columns, and merged cells, outputting JSON. platform: document-processing -control: SmartDataExtractor +control: PDF documentation: UG +keywords: Assemblies --- -# Frequently Asked Questions in Blazor SfPdfViewer Component +# Frequently Asked Questions in Smart Table Extractor -Common questions and answers for using the Syncfusion Data Extraction Library. +Common questions and answers for using the Syncfusion Table Extraction. 
* [How to Resolve the ONNX File Missing Error in Smart Table Extractor?](./FAQ/how-to-resolve-the-onnx-file-missing-error-in-smart-table-extractor) diff --git a/Document-Processing/DataExtraction/NET/SmartTableExtractor/overview.md b/Document-Processing/DataExtraction/NET/SmartTableExtractor/overview.md index 676caf54b..4cebbb54c 100644 --- a/Document-Processing/DataExtraction/NET/SmartTableExtractor/overview.md +++ b/Document-Processing/DataExtraction/NET/SmartTableExtractor/overview.md @@ -1,9 +1,10 @@ --- title: Extract tables from PDF and image documents in .NET | Syncfusion -description: Syncfusion® Smart Table Extractor is a .NET library that extracts tabular data from PDF documents. It detects table regions, header rows, columns, cell spans (merged cells), and provides structured JSON. -platform: SmartTableExtractor +description: Syncfusion® Smart Table Extractor detects tables in PDFs, including headers, columns, and merged cells, outputting JSON. +platform: document-processing control: PDF documentation: UG +keywords: Assemblies --- # Overview of SmartTableExtractor diff --git a/Document-Processing/DataExtraction/NET/overview.md b/Document-Processing/DataExtraction/NET/overview.md index be7d8766c..a3755d3d2 100644 --- a/Document-Processing/DataExtraction/NET/overview.md +++ b/Document-Processing/DataExtraction/NET/overview.md @@ -1,14 +1,25 @@ --- -title: Extract structured data from PDF and image documents in .NET | Syncfusion -description: Syncfusion® Smart Data Extractor is a .NET library that extracts tables, form fields, text blocks, and images from PDF and image documents, producing PDFs and structured JSON for verification, automation and processing. +title: Extract structured data from PDF & image files in .NET | Syncfusion +description: Syncfusion® Smart Data Extractor is a .NET library that extracts tables, forms, text, and images from documents, producing PDFs and JSON.
platform: document-processing control: SmartDataExtractor documentation: UG +keywords: Assemblies --- -# Overview of SmartDataExtractor +# Welcome to Syncfusion Data Extraction Library -Syncfusion® Smart Data Extractor is a high performance, deterministic C# library that extracts complete document structures from PDFs and images. Designed for .NET workflows, it analyzes visual layout lines, boxes, labels, and alignment to locate and extract elements such as table structure, text elements, images, headers, footers, and form fields with per field confidence scores for immediate review, export, or integration. +Syncfusion® is a high performance, deterministic C# library that extracts complete document structures from PDFs and images. +# List of DataExtraction: + +* PDF Library - is a class library used to create, read, and write PDF files through code in .NET [Windows Forms, WPF, ASP.NET MVC, ASP.NET Core, Blazor, MAUI] and Flutter applications. +* PDF Conversions - is a class library that convert several file formats like HTML, Word, Excel, PowerPoint, and images to PDF documents. It also supports convert PDF to image. +* PDF Viewer - GUI component used to view, edit and print PDF files in Windows Forms, WPF, JavaScript, Angular, React, Vue, ASP.NET MVC, ASP.NET Core, Blazor, MAUI and Flutter applications. +* Smart PDF Viewer – is an AI-enhanced viewer built on top of the PDF Viewer component, offering intelligent features in Blazor applications including document summarization, question answering, smart redact, and smart fill. + +* SmartDataExtractor - analyzes visual layout lines, boxes, labels, and alignment to locate and extract elements such as table structure, text elements, images, headers, footers, and form fields with per-field confidence scores for immediate review, export, or integration.
+* SmartTableExtractor - detects table regions, header rows, columns, and cell spans (merged cells) and provides per-cell confidence scores and structured exports ready for downstream processing. +* SmartFormRecognizer - analyzes visual layout cues—lines, boxes and circles—it locates form regions and extracts common controls (text fields, checkboxes, radio buttons, signatures), producing clean JSON with per-field confidence scores. Where form fields are detected, the library can also produce a fillable PDF with corresponding form fields added for immediate use. From 5ba74cbe8c58828d9dafac74afe98228b1c12945 Mon Sep 17 00:00:00 2001 From: venkateshwaransf5013 Date: Mon, 9 Mar 2026 13:30:07 +0530 Subject: [PATCH 10/13] Resolved the CI issue --- ...the-onnx-file-missing-error-in-smart-data-extractor.md} | 0 ...he-onnx-file-missing-error-in-smart-table-extractor.md} | 0 Document-Processing/DataExtraction/NET/overview.md | 7 +------ 3 files changed, 1 insertion(+), 6 deletions(-) rename Document-Processing/DataExtraction/NET/SmartDataExtractor/FAQ/{how-to-resolve-the-onnx-file-missing-error-in-smart-data-extractor => how-to-resolve-the-onnx-file-missing-error-in-smart-data-extractor.md} (100%) rename Document-Processing/DataExtraction/NET/SmartTableExtractor/FAQ/{how-to-resolve-the-onnx-file-missing-error-in-smart-table-extractor => how-to-resolve-the-onnx-file-missing-error-in-smart-table-extractor.md} (100%) diff --git a/Document-Processing/DataExtraction/NET/SmartDataExtractor/FAQ/how-to-resolve-the-onnx-file-missing-error-in-smart-data-extractor b/Document-Processing/DataExtraction/NET/SmartDataExtractor/FAQ/how-to-resolve-the-onnx-file-missing-error-in-smart-data-extractor.md similarity index 100% rename from Document-Processing/DataExtraction/NET/SmartDataExtractor/FAQ/how-to-resolve-the-onnx-file-missing-error-in-smart-data-extractor rename to 
Document-Processing/DataExtraction/NET/SmartDataExtractor/FAQ/how-to-resolve-the-onnx-file-missing-error-in-smart-data-extractor.md diff --git a/Document-Processing/DataExtraction/NET/SmartTableExtractor/FAQ/how-to-resolve-the-onnx-file-missing-error-in-smart-table-extractor b/Document-Processing/DataExtraction/NET/SmartTableExtractor/FAQ/how-to-resolve-the-onnx-file-missing-error-in-smart-table-extractor.md similarity index 100% rename from Document-Processing/DataExtraction/NET/SmartTableExtractor/FAQ/how-to-resolve-the-onnx-file-missing-error-in-smart-table-extractor rename to Document-Processing/DataExtraction/NET/SmartTableExtractor/FAQ/how-to-resolve-the-onnx-file-missing-error-in-smart-table-extractor.md diff --git a/Document-Processing/DataExtraction/NET/overview.md b/Document-Processing/DataExtraction/NET/overview.md index a3755d3d2..282299f8a 100644 --- a/Document-Processing/DataExtraction/NET/overview.md +++ b/Document-Processing/DataExtraction/NET/overview.md @@ -11,12 +11,7 @@ keywords: Assemblies Syncfusion® is a high performance, deterministic C# library that extracts complete document structures from PDFs and images. -# List of DataExtraction: - -* PDF Library - is a class library used to create, read, and write PDF files through code in .NET [Windows Forms, WPF, ASP.NET MVC, ASP.NET Core, Blazor, MAUI] and Flutter applications. -* PDF Conversions - is a class library that convert several file formats like HTML, Word, Excel, PowerPoint, and images to PDF documents. It also supports convert PDF to image. -* PDF Viewer - GUI component used to view, edit and print PDF files in Windows Forms, WPF, JavaScript, Angular, React, Vue, ASP.NET MVC, ASP.NET Core, Blazor, MAUI and Flutter applications. -* Smart PDF Viewer – is an AI-enhanced viewer built on top of the PDF Viewer component, offering intelligent features in Blazor applications including document summarization, question answering, smart redact, and smart fill. 
+## List of DataExtraction: * SmartDataExtractor - analyzes visual layout lines, boxes, labels, and alignment to locate and extract elements such as table structure, text elements, images, headers, footers, and form fields with per-field confidence scores for immediate review, export, or integration. * SmartTableExtractor - detects table regions, header rows, columns, and cell spans (merged cells) and provides per-cell confidence scores and structured exports ready for downstream processing. From e5bd21d747261e4dfa390ff513554c2687447234 Mon Sep 17 00:00:00 2001 From: venkateshwaransf5013 Date: Mon, 9 Mar 2026 13:39:44 +0530 Subject: [PATCH 11/13] renamed the platform --- ...the-onnx-file-missing-error-in-smart-table-extractor.md | 7 ++++--- 1 file changed, 4 insertions(+), 3 deletions(-) diff --git a/Document-Processing/DataExtraction/NET/SmartTableExtractor/FAQ/how-to-resolve-the-onnx-file-missing-error-in-smart-table-extractor.md b/Document-Processing/DataExtraction/NET/SmartTableExtractor/FAQ/how-to-resolve-the-onnx-file-missing-error-in-smart-table-extractor.md index a5976520f..69428065f 100644 --- a/Document-Processing/DataExtraction/NET/SmartTableExtractor/FAQ/how-to-resolve-the-onnx-file-missing-error-in-smart-table-extractor.md +++ b/Document-Processing/DataExtraction/NET/SmartTableExtractor/FAQ/how-to-resolve-the-onnx-file-missing-error-in-smart-table-extractor.md @@ -1,9 +1,10 @@ --- title: Extract tables from PDF and image documents in .NET | Syncfusion -description: Syncfusion® Smart Table Extractor is a .NET library that extracts tabular data from PDF documents. It detects table regions, header rows, columns, cell spans (merged cells), and provides structured JSON. -platform: documentProcessing -control: SmartTableExtractor +description: Syncfusion® Smart Table Extractor detects tables in PDFs, including headers, columns, and merged cells, outputting JSON. 
+platform: document-processing +control: PDF documentation: UG +keywords: Assemblies --- # How to resolve the “ONNX file missing” error in Smart Table Extractor From 583a772c459ccf942343a6fd57fe5216b1a61cdf Mon Sep 17 00:00:00 2001 From: venkateshwaransf5013 Date: Mon, 9 Mar 2026 16:43:55 +0530 Subject: [PATCH 12/13] Changed the folder structure --- Document-Processing-toc.html | 30 +++++++++---------- .../NET}/Assemblies-Required.md | 0 ...e-missing-error-in-smart-data-extractor.md | 0 .../NET}/Features.md | 0 .../NET}/NuGet-Packages-Required.md | 0 .../NET}/faq.md | 0 .../NET}/overview.md | 0 .../NET}/Assemblies-Required.md | 0 ...-missing-error-in-smart-table-extractor.md | 0 .../NET}/Features.md | 0 .../NET}/NuGet-Packages-Required.md | 0 .../NET}/faq.md | 0 .../NET}/overview.md | 0 .../DataExtraction/{NET => }/overview.md | 0 14 files changed, 15 insertions(+), 15 deletions(-) rename Document-Processing/DataExtraction/{NET/SmartDataExtractor => SmartDataExtractor/NET}/Assemblies-Required.md (100%) rename Document-Processing/DataExtraction/{NET/SmartDataExtractor => SmartDataExtractor/NET}/FAQ/how-to-resolve-the-onnx-file-missing-error-in-smart-data-extractor.md (100%) rename Document-Processing/DataExtraction/{NET/SmartDataExtractor => SmartDataExtractor/NET}/Features.md (100%) rename Document-Processing/DataExtraction/{NET/SmartDataExtractor => SmartDataExtractor/NET}/NuGet-Packages-Required.md (100%) rename Document-Processing/DataExtraction/{NET/SmartDataExtractor => SmartDataExtractor/NET}/faq.md (100%) rename Document-Processing/DataExtraction/{NET/SmartDataExtractor => SmartDataExtractor/NET}/overview.md (100%) rename Document-Processing/DataExtraction/{NET/SmartTableExtractor => SmartTableExtractor/NET}/Assemblies-Required.md (100%) rename Document-Processing/DataExtraction/{NET/SmartTableExtractor => SmartTableExtractor/NET}/FAQ/how-to-resolve-the-onnx-file-missing-error-in-smart-table-extractor.md (100%) rename 
Document-Processing/DataExtraction/{NET/SmartTableExtractor => SmartTableExtractor/NET}/Features.md (100%) rename Document-Processing/DataExtraction/{NET/SmartTableExtractor => SmartTableExtractor/NET}/NuGet-Packages-Required.md (100%) rename Document-Processing/DataExtraction/{NET/SmartTableExtractor => SmartTableExtractor/NET}/faq.md (100%) rename Document-Processing/DataExtraction/{NET/SmartTableExtractor => SmartTableExtractor/NET}/overview.md (100%) rename Document-Processing/DataExtraction/{NET => }/overview.md (100%) diff --git a/Document-Processing-toc.html b/Document-Processing-toc.html index 4e633af2f..65600c51f 100644 --- a/Document-Processing-toc.html +++ b/Document-Processing-toc.html @@ -114,28 +114,28 @@ NuGet Packages
              • - DataExtraction + DataExtraction
                • - NET + NET
                  • - DataExtractor + DataExtractor
                    • - TableExtractor + TableExtractor
                      • - Assemblies Required + Assemblies Required
                      • - NuGet Packages Required + NuGet Packages Required
                      • - Features + Features
                      • - FAQ + FAQ
                      • @@ -3201,7 +3201,7 @@
                      • - DataExtraction + DataExtraction
                        • SmartFormRecognizer diff --git a/Document-Processing/DataExtraction/NET/SmartDataExtractor/Assemblies-Required.md b/Document-Processing/DataExtraction/SmartDataExtractor/NET/Assemblies-Required.md similarity index 100% rename from Document-Processing/DataExtraction/NET/SmartDataExtractor/Assemblies-Required.md rename to Document-Processing/DataExtraction/SmartDataExtractor/NET/Assemblies-Required.md diff --git a/Document-Processing/DataExtraction/NET/SmartDataExtractor/FAQ/how-to-resolve-the-onnx-file-missing-error-in-smart-data-extractor.md b/Document-Processing/DataExtraction/SmartDataExtractor/NET/FAQ/how-to-resolve-the-onnx-file-missing-error-in-smart-data-extractor.md similarity index 100% rename from Document-Processing/DataExtraction/NET/SmartDataExtractor/FAQ/how-to-resolve-the-onnx-file-missing-error-in-smart-data-extractor.md rename to Document-Processing/DataExtraction/SmartDataExtractor/NET/FAQ/how-to-resolve-the-onnx-file-missing-error-in-smart-data-extractor.md diff --git a/Document-Processing/DataExtraction/NET/SmartDataExtractor/Features.md b/Document-Processing/DataExtraction/SmartDataExtractor/NET/Features.md similarity index 100% rename from Document-Processing/DataExtraction/NET/SmartDataExtractor/Features.md rename to Document-Processing/DataExtraction/SmartDataExtractor/NET/Features.md diff --git a/Document-Processing/DataExtraction/NET/SmartDataExtractor/NuGet-Packages-Required.md b/Document-Processing/DataExtraction/SmartDataExtractor/NET/NuGet-Packages-Required.md similarity index 100% rename from Document-Processing/DataExtraction/NET/SmartDataExtractor/NuGet-Packages-Required.md rename to Document-Processing/DataExtraction/SmartDataExtractor/NET/NuGet-Packages-Required.md diff --git a/Document-Processing/DataExtraction/NET/SmartDataExtractor/faq.md b/Document-Processing/DataExtraction/SmartDataExtractor/NET/faq.md similarity index 100% rename from Document-Processing/DataExtraction/NET/SmartDataExtractor/faq.md 
rename to Document-Processing/DataExtraction/SmartDataExtractor/NET/faq.md diff --git a/Document-Processing/DataExtraction/NET/SmartDataExtractor/overview.md b/Document-Processing/DataExtraction/SmartDataExtractor/NET/overview.md similarity index 100% rename from Document-Processing/DataExtraction/NET/SmartDataExtractor/overview.md rename to Document-Processing/DataExtraction/SmartDataExtractor/NET/overview.md diff --git a/Document-Processing/DataExtraction/NET/SmartTableExtractor/Assemblies-Required.md b/Document-Processing/DataExtraction/SmartTableExtractor/NET/Assemblies-Required.md similarity index 100% rename from Document-Processing/DataExtraction/NET/SmartTableExtractor/Assemblies-Required.md rename to Document-Processing/DataExtraction/SmartTableExtractor/NET/Assemblies-Required.md diff --git a/Document-Processing/DataExtraction/NET/SmartTableExtractor/FAQ/how-to-resolve-the-onnx-file-missing-error-in-smart-table-extractor.md b/Document-Processing/DataExtraction/SmartTableExtractor/NET/FAQ/how-to-resolve-the-onnx-file-missing-error-in-smart-table-extractor.md similarity index 100% rename from Document-Processing/DataExtraction/NET/SmartTableExtractor/FAQ/how-to-resolve-the-onnx-file-missing-error-in-smart-table-extractor.md rename to Document-Processing/DataExtraction/SmartTableExtractor/NET/FAQ/how-to-resolve-the-onnx-file-missing-error-in-smart-table-extractor.md diff --git a/Document-Processing/DataExtraction/NET/SmartTableExtractor/Features.md b/Document-Processing/DataExtraction/SmartTableExtractor/NET/Features.md similarity index 100% rename from Document-Processing/DataExtraction/NET/SmartTableExtractor/Features.md rename to Document-Processing/DataExtraction/SmartTableExtractor/NET/Features.md diff --git a/Document-Processing/DataExtraction/NET/SmartTableExtractor/NuGet-Packages-Required.md b/Document-Processing/DataExtraction/SmartTableExtractor/NET/NuGet-Packages-Required.md similarity index 100% rename from 
Document-Processing/DataExtraction/NET/SmartTableExtractor/NuGet-Packages-Required.md rename to Document-Processing/DataExtraction/SmartTableExtractor/NET/NuGet-Packages-Required.md diff --git a/Document-Processing/DataExtraction/NET/SmartTableExtractor/faq.md b/Document-Processing/DataExtraction/SmartTableExtractor/NET/faq.md similarity index 100% rename from Document-Processing/DataExtraction/NET/SmartTableExtractor/faq.md rename to Document-Processing/DataExtraction/SmartTableExtractor/NET/faq.md diff --git a/Document-Processing/DataExtraction/NET/SmartTableExtractor/overview.md b/Document-Processing/DataExtraction/SmartTableExtractor/NET/overview.md similarity index 100% rename from Document-Processing/DataExtraction/NET/SmartTableExtractor/overview.md rename to Document-Processing/DataExtraction/SmartTableExtractor/NET/overview.md diff --git a/Document-Processing/DataExtraction/NET/overview.md b/Document-Processing/DataExtraction/overview.md similarity index 100% rename from Document-Processing/DataExtraction/NET/overview.md rename to Document-Processing/DataExtraction/overview.md From 9c8552eed2c711a96345226ce0c0d4e6714a34c4 Mon Sep 17 00:00:00 2001 From: venkateshwaransf5013 Date: Mon, 9 Mar 2026 17:48:07 +0530 Subject: [PATCH 13/13] Addressed the review changes --- .../NET/Assemblies-Required.md | 13 +-- .../SmartDataExtractor/NET/Features.md | 70 +++++++----- .../NET/Assemblies-Required.md | 13 +-- .../SmartTableExtractor/NET/Features.md | 105 +++++++++++++++++- 4 files changed, 156 insertions(+), 45 deletions(-) diff --git a/Document-Processing/DataExtraction/SmartDataExtractor/NET/Assemblies-Required.md b/Document-Processing/DataExtraction/SmartDataExtractor/NET/Assemblies-Required.md index 1a4bd8c5f..4325ed375 100644 --- a/Document-Processing/DataExtraction/SmartDataExtractor/NET/Assemblies-Required.md +++ b/Document-Processing/DataExtraction/SmartDataExtractor/NET/Assemblies-Required.md @@ -19,8 +19,8 @@ The following assemblies need to be referenced 
in your application based on the - {{'[WPF](https://help.syncfusion.com/document-processing/pdf/pdf-library/net/create-pdf-file-in-wpf)'| markdownify }}, - {{'[Windows Forms](https://help.syncfusion.com/document-processing/pdf/pdf-library/net/create-pdf-file-in-windows-forms)'| markdownify }} and {{'[ASP.NET MVC](https://help.syncfusion.com/document-processing/pdf/pdf-library/net/create-pdf-file-in-asp-net-mvc)'| markdownify }} + {{'[WPF]'| markdownify }}, + {{'[Windows Forms]'| markdownify }} and {{'[ASP.NET MVC]'| markdownify }} Syncfusion.Compression.Base
                          @@ -35,9 +35,9 @@ The following assemblies need to be referenced in your application based on the - {{'[Blazor](https://help.syncfusion.com/document-processing/pdf/pdf-library/net/create-pdf-document-in-blazor)'| markdownify }}, - {{'[.NET Core](https://help.syncfusion.com/document-processing/pdf/pdf-library/net/create-pdf-file-in-asp-net-core)'| markdownify }} - and {{'[.NET Platforms](https://help.syncfusion.com/document-processing/pdf/pdf-library/net/create-pdf-file-in-asp-net-mvc)'| markdownify }} + {{'[Blazor]'| markdownify }}, + {{'[.NET Core]'| markdownify }} + and {{'[.NET Platforms]'| markdownify }} Syncfusion.Compression.Portable
                          @@ -52,8 +52,7 @@ The following assemblies need to be referenced in your application based on the - {{'[Windows UI library (WinUI)](https://help.syncfusion.com/document-processing/pdf/pdf-library/net/create-pdf-file-in-winui)'| markdownify }}, - {{'[.NET Multi-platform App UI (.NET MAUI)](https://help.syncfusion.com/document-processing/pdf/pdf-library/net/create-pdf-file-in-maui)'| markdownify }} + {{'[.NET Multi-platform App UI (.NET MAUI)]'| markdownify }} Syncfusion.Compression.NET
                          diff --git a/Document-Processing/DataExtraction/SmartDataExtractor/NET/Features.md b/Document-Processing/DataExtraction/SmartDataExtractor/NET/Features.md index f6e646354..994ce6d79 100644 --- a/Document-Processing/DataExtraction/SmartDataExtractor/NET/Features.md +++ b/Document-Processing/DataExtraction/SmartDataExtractor/NET/Features.md @@ -83,10 +83,33 @@ using System.IO; using Syncfusion.SmartDataExtractor; using System.Text; -string inputPath = "Image.png"; +//Open the input image file as a stream. +using (FileStream stream = new FileStream("Image.png", FileMode.Open, FileAccess.Read)) +{ + //Initialize the Data Extractor. + DataExtractor extractor = new DataExtractor(); + //Enable form detection in the image document. + extractor.EnableFormDetection = true; + //Enable table detection in the image document. + extractor.EnableTableDetection = true; + //Set confidence threshold for extraction. + extractor.ConfidenceThreshold = 0.6; + //Extract data as JSON from the image stream. + string data = extractor.ExtractDataAsJson(stream); + //Save the extracted JSON data into an output file. + File.WriteAllText("Output.json", data, Encoding.UTF8); +} + +{% endhighlight %} + +{% highlight c# tabtitle="C# [Windows-specific]" %} + +using System.IO; +using Syncfusion.SmartDataExtractor; +using System.Text; //Open the input image file as a stream. -using (FileStream stream = new FileStream(inputPath, FileMode.Open, FileAccess.Read)) +using (FileStream stream = new FileStream("Image.png", FileMode.Open, FileAccess.Read)) { //Initialize the Data Extractor. DataExtractor extractor = new DataExtractor(); @@ -119,16 +142,15 @@ using Syncfusion.SmartDataExtractor; using Syncfusion.SmartFormRecognizer; using System.Text; -string inputPath = "Input.pdf"; - //Open the input PDF file as a stream. 
-using (FileStream stream = new FileStream(inputPath, FileMode.Open, FileAccess.Read)) +using (FileStream stream = new FileStream("Input.pdf", FileMode.Open, FileAccess.Read)) { //Initialize the Smart Data Extractor. DataExtractor extractor = new DataExtractor(); //Enable form detection in the document. extractor.EnableFormDetection = true; + extractor.EnableTableDetection = false; //Set confidence threshold for extraction. extractor.ConfidenceThreshold = 0.6 //Configure form recognition options. @@ -160,16 +182,15 @@ using Syncfusion.SmartDataExtractor; using Syncfusion.SmartFormRecognizer; using System.Text; -string inputPath = "Input.pdf"; - //Open the input PDF file as a stream. -using (FileStream stream = new FileStream(inputPath, FileMode.Open, FileAccess.Read)) +using (FileStream stream = new FileStream("Input.pdf", FileMode.Open, FileAccess.Read)) { //Initialize the Smart Data Extractor. DataExtractor extractor = new DataExtractor(); //Enable form detection in the document. extractor.EnableFormDetection = true; + extractor.EnableTableDetection = false; //Set confidence threshold for extraction. extractor.ConfidenceThreshold = 0.6 //Configure form recognition options. @@ -209,16 +230,15 @@ using Syncfusion.Pdf.Parsing; using Syncfusion.SmartDataExtractor; using Syncfusion.SmartFormRecognizer; -string inputPath = "Input.pdf"; - //Open the input PDF file as a stream. -using (FileStream stream = new FileStream(inputPath, FileMode.Open, FileAccess.Read)) +using (FileStream stream = new FileStream("Input.pdf", FileMode.Open, FileAccess.Read)) { //Initialize the Smart Data Extractor. DataExtractor extractor = new DataExtractor(); //Enable form detection in the document to identify form fields. extractor.EnableFormDetection = true; + extractor.EnableTableDetection = false; //Apply confidence threshold to extract only reliable data. 
extractor.ConfidenceThreshold = 0.6; @@ -258,10 +278,8 @@ using Syncfusion.Pdf.Parsing; using Syncfusion.SmartDataExtractor; using Syncfusion.SmartFormRecognizer; -string inputPath = "Input.pdf"; - //Open the input PDF file as a stream. -using (FileStream stream = new FileStream(inputPath, FileMode.Open, FileAccess.Read)) +using (FileStream stream = new FileStream("Input.pdf", FileMode.Open, FileAccess.Read)) { //Initialize the Smart Data Extractor. DataExtractor extractor = new DataExtractor(); @@ -315,14 +333,14 @@ using Syncfusion.SmartDataExtractor; using Syncfusion.SmartTableExtractor; // Load the input PDF file. -string inputPath = "Input.pdf"; -using (FileStream stream = new FileStream(inputPath, FileMode.Open, FileAccess.Read)) +using (FileStream stream = new FileStream("Input.pdf", FileMode.Open, FileAccess.Read)) { // Initialize the Smart Data Extractor. DataExtractor extractor = new DataExtractor(); // Enable table detection and set confidence threshold. extractor.EnableTableDetection = true; + extractor.EnableFormDetection = false; extractor.ConfidenceThreshold = 0.6; // Configure table extraction options. @@ -355,14 +373,14 @@ using Syncfusion.SmartDataExtractor; using Syncfusion.SmartTableExtractor; // Load the input PDF file. -string inputPath = "Input.pdf"; -using (FileStream stream = new FileStream(inputPath, FileMode.Open, FileAccess.Read)) +using (FileStream stream = new FileStream("Input.pdf", FileMode.Open, FileAccess.Read)) { // Initialize the Smart Data Extractor. DataExtractor extractor = new DataExtractor(); // Enable table detection and set confidence threshold. extractor.EnableTableDetection = true; + extractor.EnableFormDetection = false; extractor.ConfidenceThreshold = 0.6; // Configure table extraction options. @@ -401,14 +419,14 @@ using Syncfusion.Pdf.Parsing; using Syncfusion.SmartDataExtractor; // Load the input PDF file. 
-string inputPath = "Input.pdf"; -using (FileStream stream = new FileStream(inputPath, FileMode.Open, FileAccess.Read)) +using (FileStream stream = new FileStream("Input.pdf", FileMode.Open, FileAccess.Read)) { // Initialize the Smart Data Extractor. DataExtractor extractor = new DataExtractor(); // Apply confidence threshold to extract the data. // Only elements with confidence >= 0.75 will be included in the results. + // The default confidence threshold value is 0.6. extractor.ConfidenceThreshold = 0.75; // Extract data and return as a loaded PDF document. PdfLoadedDocument pdf = extractor.ExtractDataAsPdfDocument(stream); @@ -428,14 +446,14 @@ using Syncfusion.Pdf.Parsing; using Syncfusion.SmartDataExtractor; // Load the input PDF file. -string inputPath = "Input.pdf"; -using (FileStream stream = new FileStream(inputPath, FileMode.Open, FileAccess.Read)) +using (FileStream stream = new FileStream("Input.pdf", FileMode.Open, FileAccess.Read)) { // Initialize the Smart Data Extractor. DataExtractor extractor = new DataExtractor(); // Apply confidence threshold to extract the data. // Only elements with confidence >= 0.75 will be included in the results. + // The default confidence threshold value is 0.6. extractor.ConfidenceThreshold = 0.75; // Extract data and return as a loaded PDF document. PdfLoadedDocument pdf = extractor.ExtractDataAsPdfDocument(stream); @@ -462,10 +480,8 @@ using System.IO; using Syncfusion.Pdf.Parsing; using Syncfusion.SmartDataExtractor; -string inputPath = "Input.pdf"; - //Open the input PDF file as a stream. -using (FileStream stream = new FileStream(inputPath, FileMode.Open, FileAccess.Read)) +using (FileStream stream = new FileStream("Input.pdf", FileMode.Open, FileAccess.Read)) { //Initialize the Smart Data Extractor. DataExtractor extractor = new DataExtractor(); @@ -491,10 +507,8 @@ using System.IO; using Syncfusion.Pdf.Parsing; using Syncfusion.SmartDataExtractor; -string inputPath = "Input.pdf"; - //Open the input PDF file as a stream.
-using (FileStream stream = new FileStream(inputPath, FileMode.Open, FileAccess.Read)) +using (FileStream stream = new FileStream("Input.pdf", FileMode.Open, FileAccess.Read)) { //Initialize the Smart Data Extractor. DataExtractor extractor = new DataExtractor(); diff --git a/Document-Processing/DataExtraction/SmartTableExtractor/NET/Assemblies-Required.md b/Document-Processing/DataExtraction/SmartTableExtractor/NET/Assemblies-Required.md index 1d6964ab3..3fc48ee73 100644 --- a/Document-Processing/DataExtraction/SmartTableExtractor/NET/Assemblies-Required.md +++ b/Document-Processing/DataExtraction/SmartTableExtractor/NET/Assemblies-Required.md @@ -19,8 +19,8 @@ The following assemblies need to be referenced in your application based on the - {{'[WPF](https://help.syncfusion.com/document-processing/pdf/pdf-library/net/create-pdf-file-in-wpf)'| markdownify }}, - {{'[Windows Forms](https://help.syncfusion.com/document-processing/pdf/pdf-library/net/create-pdf-file-in-windows-forms)'| markdownify }} and {{'[ASP.NET MVC](https://help.syncfusion.com/document-processing/pdf/pdf-library/net/create-pdf-file-in-asp-net-mvc)'| markdownify }} + {{'[WPF]'| markdownify }}, + {{'[Windows Forms]'| markdownify }} and {{'[ASP.NET MVC]'| markdownify }} Syncfusion.Compression.Base
                          @@ -32,9 +32,9 @@ The following assemblies need to be referenced in your application based on the - {{'[Blazor](https://help.syncfusion.com/document-processing/pdf/pdf-library/net/create-pdf-document-in-blazor)'| markdownify }}, - {{'[.NET Core](https://help.syncfusion.com/document-processing/pdf/pdf-library/net/create-pdf-file-in-asp-net-core)'| markdownify }} - and {{'[.NET Platforms](https://help.syncfusion.com/document-processing/pdf/pdf-library/net/create-pdf-file-in-asp-net-mvc)'| markdownify }} + {{'[Blazor]'| markdownify }}, + {{'[.NET Core]'| markdownify }} + and {{'[.NET Platforms]'| markdownify }} Syncfusion.Compression.Portable
                          @@ -47,8 +47,7 @@ The following assemblies need to be referenced in your application based on the - {{'[Windows UI library (WinUI)](https://help.syncfusion.com/document-processing/pdf/pdf-library/net/create-pdf-file-in-winui)'| markdownify }}, - {{'[.NET Multi-platform App UI (.NET MAUI)](https://help.syncfusion.com/document-processing/pdf/pdf-library/net/create-pdf-file-in-maui)'| markdownify }} + {{'[.NET Multi-platform App UI (.NET MAUI)]'| markdownify }} Syncfusion.Compression.NET
                          diff --git a/Document-Processing/DataExtraction/SmartTableExtractor/NET/Features.md b/Document-Processing/DataExtraction/SmartTableExtractor/NET/Features.md index be273fbfa..a0df73c20 100644 --- a/Document-Processing/DataExtraction/SmartTableExtractor/NET/Features.md +++ b/Document-Processing/DataExtraction/SmartTableExtractor/NET/Features.md @@ -37,7 +37,34 @@ using (FileStream stream = new FileStream("Input.pdf", FileMode.Open, FileAccess // Extract and save string data = extractor.ExtractTableAsJson(stream); - File.WriteAllText("TableOutput_AllOptions.json", data, Encoding.UTF8); + File.WriteAllText("Output.json", data, Encoding.UTF8); +} + +{% endhighlight %} + +{% highlight c# tabtitle="C# [Windows-specific]" %} + +using System.IO; +using System.Text; +using Syncfusion.SmartTableExtractor; + +//Open the input PDF file as a stream. +using (FileStream stream = new FileStream("Input.pdf", FileMode.Open, FileAccess.Read)) +{ + // Initialize the Smart Table Extractor + TableExtractor extractor = new TableExtractor(); + + // Set all three options together + TableExtractionOptions options = new TableExtractionOptions(); + options.DetectBorderlessTables = true; + options.PageRange = new int[,] { { 1, 5 } }; + options.ConfidenceThreshold = 0.75; + + extractor.TableExtractionOptions = options; + + // Extract and save + string data = extractor.ExtractTableAsJson(stream); + File.WriteAllText("Output.json", data, Encoding.UTF8); } {% endhighlight %} @@ -74,6 +101,30 @@ using (FileStream stream = new FileStream("Input.pdf", FileMode.Open, FileAccess {% endhighlight %} +{% highlight c# tabtitle="C# [Windows-specific]" %} + +using System.IO; +using System.Text; +using Syncfusion.SmartTableExtractor; + +using (FileStream stream = new FileStream("Input.pdf", FileMode.Open, FileAccess.Read)) +{ + // Initialize the Smart Table Extractor + TableExtractor extractor = new TableExtractor(); + + // Set DetectBorderlessTables + TableExtractionOptions options = 
new TableExtractionOptions(); + options.DetectBorderlessTables = true; + + extractor.TableExtractionOptions = options; + + // Extract and save + string data = extractor.ExtractTableAsJson(stream); + File.WriteAllText("Output.json", data, Encoding.UTF8); +} + +{% endhighlight %} + {% endtabs %} ## Extract Tables Within a Specific Page Range @@ -106,6 +157,30 @@ using (FileStream stream = new FileStream("Input.pdf", FileMode.Open, FileAccess {% endhighlight %} +{% highlight c# tabtitle="C# [Windows-specific]" %} + +using System.IO; +using System.Text; +using Syncfusion.SmartTableExtractor; + +using (FileStream stream = new FileStream("Input.pdf", FileMode.Open, FileAccess.Read)) +{ + // Initialize the Smart Table Extractor + TableExtractor extractor = new TableExtractor(); + + // Set only PageRange + TableExtractionOptions options = new TableExtractionOptions(); + options.PageRange = new int[,] { { 2, 4 } }; + + extractor.TableExtractionOptions = options; + + // Extract and save + string data = extractor.ExtractTableAsJson(stream); + File.WriteAllText("Output.json", data, Encoding.UTF8); +} + +{% endhighlight %} + {% endtabs %} ## Apply confidence threshold to extract the Table @@ -138,6 +213,30 @@ using (FileStream stream = new FileStream("Input.pdf", FileMode.Open, FileAccess {% endhighlight %} +{% highlight c# tabtitle="C# [Windows-specific]" %} + +using System.IO; +using System.Text; +using Syncfusion.SmartTableExtractor; + +using (FileStream stream = new FileStream("Input.pdf", FileMode.Open, FileAccess.Read)) +{ + // Initialize the Smart Table Extractor + TableExtractor extractor = new TableExtractor(); + + // Set ConfidenceThreshold + TableExtractionOptions options = new TableExtractionOptions(); + options.ConfidenceThreshold = 0.6; + + extractor.TableExtractionOptions = options; + + // Extract and save + string data = extractor.ExtractTableAsJson(stream); + File.WriteAllText("Output.json", data, Encoding.UTF8); +} + +{% endhighlight %} + {% endtabs %} ## 
Extract table data asynchronously from a PDF document @@ -170,7 +269,7 @@ using (FileStream stream = new FileStream("Input.pdf", FileMode.Open, FileAccess string data = await tableExtractor.ExtractTableAsJsonAsync(stream, cts.Token); // Save the extracted data as JSON - File.WriteAllText("TableOutput.json", data, Encoding.UTF8); + File.WriteAllText("Output.json", data, Encoding.UTF8); } @@ -200,7 +299,7 @@ using (FileStream stream = new FileStream("Input.pdf", FileMode.Open, FileAccess string data = await tableExtractor.ExtractTableAsJsonAsync(stream, cts.Token); // Save the extracted data as JSON - File.WriteAllText("TableOutput.json", data, Encoding.UTF8); + File.WriteAllText("Output.json", data, Encoding.UTF8); }