Program.cs
using System;
using System.Xml;
using Bytescout.PDFExtractor;
namespace ReadValuesFromFormFields
{
class Program
{
static void Main(string[] args)
{
try
{
// Create XMLExtractor interface
using (XMLExtractor extractor = new XMLExtractor("demo", "demo"))
{
// Load Sample PDF document
extractor.LoadDocumentFromFile("filled_form.pdf");
// Get PDF document text as XML
string xmlText = extractor.GetXML();
// Load XML
XmlDocument xmlDocument = new XmlDocument();
xmlDocument.LoadXml(xmlText);
// Select all "control" nodes
XmlNodeList formControls = xmlDocument.SelectNodes("//control");
if (formControls != null)
{
foreach (XmlNode formControl in formControls)
{
XmlAttribute typeAttribute = formControl.Attributes["type"];
// Get filled textboxes
if (typeAttribute.Value == "editbox")
{
if (!string.IsNullOrEmpty(formControl.InnerText))
{
Console.WriteLine("EDITBOX " + formControl.Attributes["id"].Value + ": " + formControl.InnerText);
}
}
// Get checked checkboxes
else if (typeAttribute.Value == "checkbox")
{
if (formControl.Attributes["state"].Value == "1")
{
Console.WriteLine("CHECKBOX " + formControl.Attributes["id"].Value + ": " + formControl.Attributes["state"].Value);
}
}
}
}
}
}
catch (Exception ex)
{
Console.WriteLine(ex.Message);
}
Console.WriteLine();
Console.WriteLine("Press any key to exit...");
Console.ReadLine();
}
}
}
Click here to get your Free Trial version of the SDK
also available as: