The sample code below shows how to convert a PDF file to CSV page by page (one CSV file per page) in C#, VB.NET and VBScript using ByteScout PDF Extractor SDK.
Select your programming language:
using System;
using System.Collections.Generic;
using System.Text;
using Bytescout.PDFExtractor;
using System.Diagnostics;

namespace ConsoleApplication1
{
    /// <summary>
    /// Console sample that loads "sample3.pdf" and writes each page to its own
    /// CSV file named "page&lt;index&gt;.csv" in the current working directory.
    /// </summary>
    class Program
    {
        /// <summary>
        /// Entry point: extracts every page of the sample PDF to a separate CSV file,
        /// then waits for a key press before exiting.
        /// </summary>
        /// <param name="args">Command-line arguments (not used).</param>
        static void Main(string[] args)
        {
            // Create Bytescout.PDFExtractor.CSVExtractor instance.
            // The using statement guarantees the extractor is disposed (releasing the
            // loaded document) even if loading or saving throws.
            using (CSVExtractor extractor = new CSVExtractor())
            {
                extractor.RegistrationName = "demo";
                extractor.RegistrationKey = "demo";

                // Load sample PDF document
                extractor.LoadDocumentFromFile("sample3.pdf");

                // You can change the CSV separator symbol from "," to another one
                // if needed for non-US locales:
                //extractor.CSVSeparatorSymbol = ",";

                // Get page count
                int pageCount = extractor.GetPageCount();

                // The same index is used for the page number and the file name,
                // so the first output file is "page0.csv".
                for (int i = 0; i < pageCount; i++)
                {
                    string fileName = "page" + i + ".csv";

                    // Save extracted page text to file
                    extractor.SavePageCSVToFile(i, fileName);
                }
            }

            Console.WriteLine();
            Console.WriteLine("Data has been extracted to separate files for pages.");
            Console.WriteLine();
            Console.WriteLine("Press any key to continue...");
            Console.ReadKey();

            // Uncomment to open the first page's CSV in the default viewer:
            //Process.Start("page0.csv");
        }
    }
}
Imports System
Imports System.Collections.Generic
Imports System.Text
Imports Bytescout.PDFExtractor
Imports System.Diagnostics

Namespace ConsoleApplication1
    ''' <summary>
    ''' Console sample that loads "sample3.pdf" and writes each page to its own
    ''' CSV file named "page&lt;index&gt;.csv" in the current working directory.
    ''' </summary>
    Class Program
        ''' <summary>
        ''' Entry point: extracts every page of the sample PDF to a separate CSV file,
        ''' waits for a key press, then opens the first page's CSV if one was written.
        ''' </summary>
        ''' <param name="args">Command-line arguments (not used).</param>
        Shared Sub Main(ByVal args As String())
            Dim pageCount As Integer

            ' Create Bytescout.PDFExtractor.CSVExtractor instance.
            ' The Using block guarantees the extractor is disposed (releasing the
            ' loaded document) even if loading or saving throws.
            Using extractor As New CSVExtractor()
                extractor.RegistrationName = "demo"
                extractor.RegistrationKey = "demo"

                ' Load sample PDF document
                extractor.LoadDocumentFromFile("sample3.pdf")

                ' You can change the CSV separator symbol from "," to another one
                ' if needed for non-US locales:
                'extractor.CSVSeparatorSymbol = ","

                ' Get page count
                pageCount = extractor.GetPageCount()

                ' The same index is used for the page number and the file name,
                ' so the first output file is "page0.csv".
                For i As Integer = 0 To pageCount - 1
                    Dim fileName As String = "page" & i & ".csv"

                    ' Save extracted page text to file
                    extractor.SavePageCSVToFile(i, fileName)
                Next
            End Using

            Console.WriteLine()
            Console.WriteLine("Press any key to continue and open CSV in default CSV viewer (or Excel)...")
            Console.ReadKey()

            ' "page0.csv" is only written when the document has at least one page;
            ' starting a non-existent file would throw.
            If pageCount > 0 Then
                Process.Start("page0.csv")
            End If
        End Sub
    End Class
End Namespace
' Splits "../../sample3.pdf" into one CSV file per page ("page0.csv", "page1.csv", ...)
' using the Bytescout.PDFExtractor.CSVExtractor COM object, then shows a message box.
Dim csvExtractor, totalPages, pageIndex, outputName

' Instantiate the extractor COM object and apply the registration details
Set csvExtractor = CreateObject("Bytescout.PDFExtractor.CSVExtractor")
csvExtractor.RegistrationName = "demo"
csvExtractor.RegistrationKey = "demo"

' Open the sample PDF document
Call csvExtractor.LoadDocumentFromFile("../../sample3.pdf")

' The CSV separator symbol can be changed from "," to another one
' if needed for non-US locales:
'csvExtractor.CSVSeparatorSymbol = ","

' Ask the extractor how many pages the document has
totalPages = csvExtractor.GetPageCount()

' Walk the pages starting at index 0; the index doubles as the file-name suffix
pageIndex = 0
Do While pageIndex < totalPages
    outputName = "page" & pageIndex & ".csv"

    ' Write this page's extracted data to its own CSV file
    Call csvExtractor.SavePageCSVToFile(pageIndex, outputName)

    pageIndex = pageIndex + 1
Loop

MsgBox "Data has been extracted to 'page0.csv' and other files."