PDF To XML With Images - VB.NET
PDF Extractor SDK sample in VB.NET demonstrating ‘PDF To XML With Images’
Module1.vb
Imports Bytescout.PDFExtractor
Namespace PDF2XML
    ''' <summary>
    ''' Console sample that converts "sample1.pdf" to XML twice: once with images
    ''' written to external PNG files and once with images embedded in the XML.
    ''' </summary>
    Class Program
        ''' <summary>
        ''' Entry point. Loads the sample PDF and writes two XML result files
        ''' using the relative paths hard-coded below.
        ''' </summary>
        ''' <param name="args">Command-line arguments; not used.</param>
        Shared Sub Main(ByVal args As String())
            ' Create the Bytescout.PDFExtractor.XMLExtractor instance inside a Using
            ' block so that Dispose() is called even when loading or saving throws.
            Using extractor As New XMLExtractor()
                extractor.RegistrationName = "demo"
                extractor.RegistrationKey = "demo"

                ' Load sample PDF document
                extractor.LoadDocumentFromFile("sample1.pdf")

                ' Uncomment this line to get rid of empty nodes in XML
                'extractor.PreserveFormattingOnTextExtraction = False

                ' Set output image format
                extractor.ImageFormat = OutputImageFormat.PNG

                ' First pass: save images to external files
                extractor.SaveImages = ImageHandling.OuterFile
                extractor.ImageFolder = "images" ' Folder for external images
                extractor.SaveXMLToFile("result_with_external_images.xml")

                ' Second pass: embed images into XML as Base64 encoded string
                extractor.SaveImages = ImageHandling.Embed
                extractor.SaveXMLToFile("result_with_embedded_images.xml")
            End Using ' Cleanup: the extractor is disposed here
        End Sub
    End Class
End Namespace
Resources.Designer.vb
'------------------------------------------------------------------------------
' <