Read Values from Form Fields - VB.NET
PDF Extractor SDK sample in VB.NET demonstrating ‘Read Values from Form Fields’
Program.vb
Imports System.Xml
Imports Bytescout.PDFExtractor
Module Program
Sub Main()
Try
' Create XMLExtractor interface
Using extractor As New XMLExtractor("demo", "demo")
' Load Sample PDF document
extractor.LoadDocumentFromFile("filled_form.pdf")
' Get PDF document text as XML
Dim xmlText As String = extractor.GetXML
' Load XML
Dim xmlDocument As XmlDocument = New XmlDocument
xmlDocument.LoadXml(xmlText)
' Select all "control" nodes
Dim formControls As XmlNodeList = xmlDocument.SelectNodes("//control")
If (Not (formControls) Is Nothing) Then
For Each formControl As XmlNode In formControls
Dim typeAttribute As XmlAttribute = formControl.Attributes("type")
' Get filled textboxes
If (typeAttribute.Value = "editbox") Then
If Not String.IsNullOrEmpty(formControl.InnerText) Then
Console.WriteLine(("EDITBOX " + (formControl.Attributes("id").Value + (": " + formControl.InnerText))))
End If
End If
' Get checked checkboxes
If (typeAttribute.Value = "checkbox") Then
If (formControl.Attributes("state").Value = "1") Then
Console.WriteLine(("CHECKBOX " _
+ (formControl.Attributes("id").Value + (": " + formControl.Attributes("state").Value))))
End If
End If
Next
End If
End Using
Catch ex As Exception
Console.WriteLine(ex.Message)
End Try
Console.WriteLine()
Console.WriteLine("Press any key to exit...")
Console.ReadLine()
End Sub
End Module