Convert PDF To HTML From URL | VB.NET | ByteScout PDF To HTML SDK

Convert PDF To HTML From URL | VB.NET

Module1.vb:

VB
Imports System.IO
Imports System.Net
Imports Newtonsoft.Json
Imports Newtonsoft.Json.Linq

Module Module1

    ' Console sample: converts a PDF available at a public URL into an HTML file
    ' using the PDF.co "PDF To HTML" web API, then downloads the result locally.

    ' The authentication key (API Key).
    ' Get your own by registering at https://app.pdf.co
    Const API_KEY As String = "***********************************"

    ' Direct URL of source PDF file.
    ' You can also upload your own file into PDF.co and use it as url. Check "Upload File" samples for code snippets: https://github.com/bytescout/pdf-co-api-samples/tree/master/File%20Upload/
    Const SourceFileUrl As String = "https://bytescout-com.s3.amazonaws.com/files/demo-files/cloud-api/pdf-to-html/sample.pdf"
    ' Comma-separated list of page indices (or ranges) to process. Leave empty for all pages. Example: '0,2-5,7-'.
    Const Pages As String = ""
    ' PDF document password. Leave empty for unprotected documents.
    Const Password As String = ""
    ' Destination HTML file name
    Const DestinationFile As String = ".\result.html"
    ' Set to `true` to get simplified HTML without CSS. Default is the rich HTML keeping the document design.
    Const PlainHtml As Boolean = False
    ' Set to `true` if your document has the column layout like a newspaper.
    Const ColumnLayout As Boolean = False

    ' Entry point.
    ' Builds the JSON request from the constants above, POSTs it to the API,
    ' and on success downloads the generated HTML file to DestinationFile.
    ' API-reported errors, network failures and malformed responses are written
    ' to the console instead of crashing the program.
    Sub Main()

        ' Prepare URL for `PDF To HTML` API call
        Dim url As String = "https://api.pdf.co/v1/pdf/convert/to/html"

        ' Prepare requests params as JSON
        ' See documentation: https://apidocs.pdf.co
        Dim parameters As New Dictionary(Of String, Object)
        parameters.Add("name", Path.GetFileName(DestinationFile))
        parameters.Add("password", Password)
        parameters.Add("pages", Pages)
        parameters.Add("simple", PlainHtml)
        parameters.Add("columns", ColumnLayout)
        parameters.Add("url", SourceFileUrl)

        ' Convert dictionary of params to JSON
        Dim jsonPayload As String = JsonConvert.SerializeObject(parameters)

        ' `Using` guarantees the web client is disposed even if an unexpected
        ' exception (anything not caught below) escapes the Try block.
        Using webClient As New WebClient()

            ' Set API Key
            webClient.Headers.Add("x-api-key", API_KEY)

            ' Set JSON content type
            webClient.Headers.Add("Content-Type", "application/json")

            Try
                ' Execute POST request with JSON payload
                Dim response As String = webClient.UploadString(url, jsonPayload)

                ' Parse JSON response
                Dim json As JObject = JObject.Parse(response)

                ' Value(Of T) yields Nothing for a missing field instead of
                ' throwing NullReferenceException on the indexer result.
                Dim hasError As Boolean = json.Value(Of Boolean?)("error").GetValueOrDefault(False)

                If Not hasError Then

                    ' Get URL of generated HTML file
                    Dim resultFileUrl As String = json.Value(Of String)("url")

                    If String.IsNullOrEmpty(resultFileUrl) Then
                        Console.WriteLine("The API response does not contain a result file URL.")
                    Else
                        ' Download HTML file
                        webClient.DownloadFile(resultFileUrl, DestinationFile)

                        Console.WriteLine("Generated HTML file saved as ""{0}"" file.", DestinationFile)
                    End If

                Else
                    ' Report the error message supplied by the API (if any)
                    Dim message As String = json.Value(Of String)("message")
                    If String.IsNullOrEmpty(message) Then
                        message = "The API reported an error without a message."
                    End If
                    Console.WriteLine(message)
                End If

            Catch ex As WebException
                ' Network / HTTP-level failure
                Console.WriteLine(ex.ToString())
            Catch ex As JsonException
                ' Response body was not valid JSON
                Console.WriteLine(ex.ToString())
            End Try

        End Using


        Console.WriteLine()
        Console.WriteLine("Press any key...")
        Console.ReadKey()

    End Sub

End Module