Cloud API - PDF To Text - C# - Convert PDF To Text From URL Asynchronously - ByteScout
Announcement
Our ByteScout SDK products are sunsetting as we focus on expanding new solutions.
Learn More Open modal
Close modal
Announcement Important Update
ByteScout SDK Sunsetting Notice
Our ByteScout SDK products are sunsetting as we focus on our new & improved solutions. Thank you for being part of our journey, and we look forward to supporting you in this next chapter!

Cloud API – PDF To Text – C# – Convert PDF To Text From URL Asynchronously

  • Home
  • /
  • Articles
  • /
  • Cloud API – PDF To Text – C# – Convert PDF To Text From URL Asynchronously

Cloud API – PDF To Text – C# – Convert PDF To Text From URL Asynchronously

Program.cs

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
using System;
using System.IO;
using System.Net;
using System.Threading;
using Newtonsoft.Json.Linq;
 
// Cloud API asynchronous "PDF To Text" job example.
// Allows to avoid timeout errors when processing huge or scanned PDF documents.
 
namespace ByteScoutWebApiExample
{
    class Program
    {
        // (!) If you are getting '(403) Forbidden' error please ensure you have set the correct API_KEY
         
        // The authentication key (API Key).
        // Get your own by registering at https://secure.bytescout.com/users/sign_up
        const String API_KEY = "***********************************";
         
        // Direct URL of source PDF file.
        // Comma-separated list of page indices (or ranges) to process. Leave empty for all pages. Example: '0,2-5,7-'.
        const string Pages = "";
        // PDF document password. Leave empty for unprotected documents.
        const string Password = "";
        // Destination TXT file name
        const string DestinationFile = @".\result.txt";
        // (!) Make asynchronous job
        const bool Async = true;
 
 
        static void Main(string[] args)
        {
            // Create standard .NET web client instance
            WebClient webClient = new WebClient();
 
            // Set API Key
            webClient.Headers.Add("x-api-key", API_KEY);
 
            // Prepare URL for `PDF To Text` API call
            string query = Uri.EscapeUriString(string.Format(
                "https://api.pdf.co/v1/pdf/convert/to/text?name={0}&password={1}&pages={2}&url={3}&async={4}",
                Path.GetFileName(DestinationFile),
                Password,
                Pages,
                SourceFileUrl,
                Async));
 
            try
            {
                // Execute request
                string response = webClient.DownloadString(query);
 
                // Parse JSON response
                JObject json = JObject.Parse(response);
 
                if (json["error"].ToObject<bool>() == false)
                {
                    // Asynchronous job ID
                    string jobId = json["jobId"].ToString();
                    // URL of generated TXT file that will be available after the job completion
                    string resultFileUrl = json["url"].ToString();
 
                    // Check the job status in a loop.
                    // If you don't want to pause the main thread you can rework the code
                    // to use a separate thread for the status checking and completion.
                    do
                    {
                        string status = CheckJobStatus(jobId); // Possible statuses: "InProgress", "Failed", "Aborted", "Finished".
 
                        // Display timestamp and status (for demo purposes)
                        Console.WriteLine(DateTime.Now.ToLongTimeString() + ": " + status);
 
                        if (status == "Finished")
                        {
                            // Download TXT file
                            webClient.DownloadFile(resultFileUrl, DestinationFile);
 
                            Console.WriteLine("Generated TXT file saved as \"{0}\" file.", DestinationFile);
                            break;
                        }
                        else if (status == "InProgress")
                        {
                            // Pause for a few seconds
                            Thread.Sleep(3000);
                        }
                        else
                        {
                            Console.WriteLine(status);
                            break;
                        }
                    }
                    while (true);
                }
                else
                {
                    Console.WriteLine(json["message"].ToString());
                }
            }
            catch (WebException e)
            {
                Console.WriteLine(e.ToString());
            }
 
            webClient.Dispose();
 
 
            Console.WriteLine();
            Console.WriteLine("Press any key...");
            Console.ReadKey();
        }
 
        static string CheckJobStatus(string jobId)
        {
            using (WebClient webClient = new WebClient())
            {
                string url = "https://api.pdf.co/v1/job/check?jobid=" + jobId;
 
                string response = webClient.DownloadString(url);
                JObject json = JObject.Parse(response);
 
                return Convert.ToString(json["Status"]);
            }
        }
    }
}

  Click here to get your Free Trial version of the SDK

Tutorials:

prev
next