Default.aspx.cs
using System;
using Bytescout.PDF2HTML;
namespace ExtractHTML
{
/// <summary>
/// Sample page that converts a PDF document to HTML with the Bytescout PDF2HTML SDK
/// and writes the generated HTML directly to the HTTP response.
/// </summary>
public partial class _Default : System.Web.UI.Page
{
    /// <summary>
    /// Loads the sample PDF, converts it to HTML (CSS mode, images embedded) and
    /// streams the result to the client as the complete response body.
    /// </summary>
    /// <param name="sender">The source of the event.</param>
    /// <param name="e">Event data (unused).</param>
    protected void Page_Load(object sender, EventArgs e)
    {
        // This test file will be copied to the project directory on the pre-build event (see the project properties).
        string inputFile = Server.MapPath(@".\bin\sample2.pdf");

        // Create Bytescout.PDF2HTML.HTMLExtractor instance
        HTMLExtractor extractor = new HTMLExtractor();
        try
        {
            extractor.RegistrationName = "demo";
            extractor.RegistrationKey = "demo";

            // Set HTML with CSS extraction mode
            extractor.ExtractionMode = HTMLExtractionMode.HTMLWithCSS;

            // Embed images into HTML file
            extractor.SaveImages = ImageHandling.Embed;

            // Load sample PDF document
            extractor.LoadDocumentFromFile(inputFile);

            Response.Clear();
            Response.ContentType = "text/html";

            // Save extracted HTML to output stream
            extractor.SaveHtmlToStream(Response.OutputStream);
        }
        finally
        {
            // Release the extractor even if loading or saving throws.
            extractor.Dispose();
        }

        // Response.End() terminates the request by raising ThreadAbortException, so
        // statements placed after it never run. It is therefore called last, after
        // the extractor has already been disposed.
        Response.End();
    }
}
}
Web.config
<?xml version="1.0"?>
<configuration>
<appSettings/>
<connectionStrings/>
<system.web>
<!--
Set compilation debug="true" to insert debugging
symbols into the compiled page. Because this
affects performance, set this value to true only
during development.
-->
<compilation debug="true" />
<!--
The <authentication> section enables configuration
of the security authentication mode used by
ASP.NET to identify an incoming user.
-->
<authentication mode="Windows" />
<!--
The <customErrors> section enables configuration
of what to do if/when an unhandled error occurs
during the execution of a request. Specifically,
it enables developers to configure html error pages
to be displayed in place of an error stack trace.
<customErrors mode="RemoteOnly" defaultRedirect="GenericErrorPage.htm">
<error statusCode="403" redirect="NoAccess.htm" />
<error statusCode="404" redirect="FileNotFound.htm" />
</customErrors>
-->
</system.web>
</configuration>