An easy-to-understand guide on how to remove empty pages from a PDF with PDF Extractor SDK in C#, using this source code sample. ByteScout PDF Suite is a bundle of six SDK libraries for working with PDF, from generating rich PDF reports to extracting data from PDF documents and converting them to HTML. The bundle includes PDF (Generator) SDK, PDF Renderer SDK, PDF Extractor SDK, PDF to HTML SDK, PDF Viewer SDK, and PDF Generator SDK for JavaScript, and you can use it to remove empty pages from a PDF with PDF Extractor SDK in C#.
This sample C# source code for ByteScout PDF Suite shows the functions and options you need when calling the API to remove empty pages from a PDF with PDF Extractor SDK. Just copy and paste the code into your C# application and follow the instructions. Complete and detailed tutorials and documentation are installed along with ByteScout PDF Suite if you'd like to learn more about the topic and the details of the API.
You can download a free trial version of ByteScout PDF Suite from our website to see and try many other source code samples for C#.
On-demand (REST Web API) version:
Web API (on-demand version)
On-premise offline SDK for Windows:
60 Day Free Trial (on-premise)
using System.Collections.Generic;
using System.Diagnostics;
using System.IO;
using Bytescout.PDFExtractor;
namespace RemoveEmptyPagesExample
{
    /// <summary>
    /// Demonstrates detecting empty pages, splitting the document into separate
    /// pages while skipping the empty ones, and then merging the remaining parts
    /// back into a single document.
    /// </summary>
    /// <remarks>
    /// A page is treated as empty when the text extracted from it is null, empty
    /// or consists only of whitespace. Only extracted text is examined.
    /// NOTE(review): pages that contain only images presumably yield no text and
    /// would therefore be dropped as well - confirm against the SDK behavior.
    /// </remarks>
    class Program
    {
        // Input document, resulting document and scratch folder for the split parts.
        private const string InputFile = @".\sample.pdf";
        private const string OutputFile = @".\result.pdf";
        private const string TempFolder = @".\temp";

        // Values passed to every SDK constructor.
        // Presumably the registration name and key - confirm against the SDK docs.
        private const string RegistrationName = "demo";
        private const string RegistrationKey = "demo";

        /// <summary>
        /// Entry point: writes a copy of <see cref="InputFile"/> without its empty
        /// pages to <see cref="OutputFile"/> and opens the result.
        /// </summary>
        /// <param name="args">Command-line arguments (not used).</param>
        static void Main(string[] args)
        {
            List<string> nonEmptyPages = FindNonEmptyPages(InputFile);

            // With no pages to keep, the range list would be an empty string and
            // there is nothing meaningful to split or merge, so stop here.
            if (nonEmptyPages.Count == 0)
            {
                System.Console.WriteLine(
                    "No non-empty pages found in \"" + InputFile + "\"; no output was written.");
                return;
            }

            // Form comma-separated list of page numbers to split ("1,3,5")
            string ranges = string.Join(",", nonEmptyPages);

            try
            {
                // Make sure the scratch folder exists; this is a no-op when it already does.
                Directory.CreateDirectory(TempFolder);

                string[] parts;

                // Split the document into the non-empty pages inside the temp folder
                using (DocumentSplitter splitter = new DocumentSplitter(RegistrationName, RegistrationKey))
                {
                    splitter.OptimizeSplittedDocuments = true;
                    parts = splitter.Split(InputFile, ranges, TempFolder);
                }

                // Merge the parts back into a single document
                using (DocumentMerger merger = new DocumentMerger(RegistrationName, RegistrationKey))
                {
                    merger.Merge(parts, OutputFile);
                }
            }
            finally
            {
                // Remove the temp folder even when splitting or merging failed.
                if (Directory.Exists(TempFolder))
                {
                    Directory.Delete(TempFolder, true);
                }
            }

            // Open result document in default associated application (for demo purpose)
            ProcessStartInfo processStartInfo = new ProcessStartInfo(OutputFile);
            processStartInfo.UseShellExecute = true;
            Process.Start(processStartInfo);
        }

        /// <summary>
        /// Collects the numbers of all pages that contain extractable text.
        /// </summary>
        /// <param name="pdfPath">Path of the PDF document to inspect.</param>
        /// <returns>
        /// One-based page numbers, as strings, in document order; empty when no
        /// page yields any non-whitespace text.
        /// </returns>
        private static List<string> FindNonEmptyPages(string pdfPath)
        {
            List<string> nonEmptyPages = new List<string>();

            // The using statement disposes the extractor even if extraction throws.
            using (TextExtractor extractor = new TextExtractor(RegistrationName, RegistrationKey))
            {
                extractor.LoadDocumentFromFile(pdfPath);

                // Query the page count once instead of on every loop iteration.
                int pageCount = extractor.GetPageCount();

                for (int pageIndex = 0; pageIndex < pageCount; pageIndex++)
                {
                    string pageText = extractor.GetTextFromPage(pageIndex);

                    // Pages are read by zero-based index, but the split ranges
                    // use one-based page numbers, hence the + 1.
                    if (!string.IsNullOrWhiteSpace(pageText))
                    {
                        nonEmptyPages.Add((pageIndex + 1).ToString());
                    }
                }
            }

            return nonEmptyPages;
        }
    }
}
60 Day Free Trial or Visit ByteScout PDF Suite Home Page
Explore ByteScout PDF Suite Documentation
Explore Samples
Sign Up for ByteScout PDF Suite Online Training
Get Your API Key
Explore Web API Docs
Explore Web API Samples
60 Day Free Trial or Visit ByteScout PDF Suite Home Page
Explore ByteScout PDF Suite Documentation
Explore Samples
Sign Up for ByteScout PDF Suite Online Training
Get Your API Key
Explore Web API Docs
Explore Web API Samples
also available as: