Convert PDF To HTML (Simple Layout) From Page - C#
PDF To HTML SDK sample in C# demonstrating ‘Convert PDF To HTML (Simple Layout) From Page’
Program.cs
using System;
using System.Diagnostics;
using Bytescout.PDF2HTML;
namespace ExtractHTMLFromPage
{
    /// <summary>
    /// Sample console program: converts a single page of a PDF document to
    /// plain HTML and opens the result in the default associated application.
    /// </summary>
    class Program
    {
        // Input PDF and resulting HTML file, resolved relative to the working directory.
        private const string InputFile = "sample2.pdf";
        private const string OutputFile = "output.html";

        // Page index passed to SaveHtmlPageToFile. The sample treats index 1 as the
        // 2nd page of the document, i.e. page indices are zero-based.
        private const int PageIndex = 1;

        /// <summary>
        /// Loads the sample PDF, saves one page as HTML, then launches the output file.
        /// </summary>
        /// <param name="args">Command-line arguments (unused).</param>
        static void Main(string[] args)
        {
            // Create Bytescout.PDF2HTML.HTMLExtractor instance
            HTMLExtractor extractor = new HTMLExtractor();
            try
            {
                extractor.RegistrationName = "demo";
                extractor.RegistrationKey = "demo";

                // Set plain HTML extraction mode
                extractor.ExtractionMode = HTMLExtractionMode.PlainHTML;

                // Load sample PDF document
                extractor.LoadDocumentFromFile(InputFile);

                // Convert the 2nd page to HTML and save it to file
                extractor.SaveHtmlPageToFile(PageIndex, OutputFile);
            }
            finally
            {
                // Cleanup: release the extractor even if loading or conversion throws,
                // so a failed run does not leave the document/resources held.
                extractor.Dispose();
            }

            // Open result document in default associated application (for demo purpose).
            // UseShellExecute = true lets the OS shell pick the handler for ".html".
            ProcessStartInfo processStartInfo = new ProcessStartInfo(OutputFile);
            processStartInfo.UseShellExecute = true;
            Process.Start(processStartInfo);
        }
    }
}