The code displayed below will guide you to install an C# app to remove empty pages from PDF with PDF extractor SDK. ByteScout Data Extraction Suite is the set that includes 3 SDK products for data extraction from PDF, scans, images and from spreadsheets: PDF Extractor SDK, Data Extraction SDK, Barcode Reader SDK. It can remove empty pages from PDF with PDF extractor SDK in C#.
This prolific sample source code in C# for ByteScout Data Extraction Suite contains various functions and other necessary options you should do calling the API to remove empty pages from PDF with PDF extractor SDK. Follow the instructions from scratch to work and copy the C# code. Enjoy writing a code with ready-to-use sample codes in C#.
You can download free trial version of ByteScout Data Extraction Suite from our website with this and other source code samples for C#.
On-demand (REST Web API) version:
Web API (on-demand version)
On-premise offline SDK for Windows:
60 Day Free Trial (on-premise)
using System.Collections.Generic;
using System.Diagnostics;
using System.IO;
using Bytescout.PDFExtractor;
namespace RemoveEmptyPagesExample
{
/// <summary>
/// The example demonstrates detection of empty pages, splitting the document to separate
/// pages excluding empty ones, then combine parts back to a single document.
/// </summary>
class Program
{
static string InputFile = @".\sample.pdf";
static string OutputFile = @".\result.pdf";
static string TempFolder = @".\temp";
static void Main(string[] args)
{
// Create and setup Bytescout.PDFExtractor.TextExtractor instance
TextExtractor extractor = new TextExtractor("demo", "demo");
// Load PDF document
extractor.LoadDocumentFromFile(InputFile);
// List to keep non-empty page numbers
List<string> nonEmptyPages = new List<string>();
// Iterate through pages
for (int pageIndex = 0; pageIndex < extractor.GetPageCount(); pageIndex++)
{
// Extract page text
string pageText = extractor.GetTextFromPage(pageIndex);
// If extracted text is not empty keep the page number
if (pageText.Length > 0)
nonEmptyPages.Add((pageIndex + 1).ToString());
}
// Cleanup
extractor.Dispose();
// Form comma-separated list of page numbers to split("1,3,5")
string ranges = string.Join(",", nonEmptyPages);
// Create Bytescout.PDFExtractor.DocumentSplitter instance
DocumentSplitter splitter = new DocumentSplitter("demo", "demo");
splitter.OptimizeSplittedDocuments = true;
// Split document by non-empty in temp folder
string[] parts = splitter.Split(InputFile, ranges, TempFolder);
// Cleanup
splitter.Dispose();
// Create Bytescout.PDFExtractor.DocumentMerger instance
DocumentMerger merger = new DocumentMerger("demo", "demo");
// Merge parts
merger.Merge(parts, OutputFile);
// Cleanup
merger.Dispose();
// Delete temp folder
Directory.Delete(TempFolder, true);
// Open result document in default associated application (for demo purpose)
ProcessStartInfo processStartInfo = new ProcessStartInfo(OutputFile);
processStartInfo.UseShellExecute = true;
Process.Start(processStartInfo);
}
}
}
60 Day Free Trial or Visit ByteScout Data Extraction Suite Home Page
Explore ByteScout Data Extraction Suite Documentation
Explore Samples
Sign Up for ByteScout Data Extraction Suite Online Training
Get Your API Key
Explore Web API Docs
Explore Web API Samples
60 Day Free Trial or Visit ByteScout Data Extraction Suite Home Page
Explore ByteScout Data Extraction Suite Documentation
Explore Samples
Sign Up for ByteScout Data Extraction Suite Online Training
Get Your API Key
Explore Web API Docs
Explore Web API Samples
also available as: