Free Trial
Web API version
Licensing
Request A Quote
HAVE QUESTIONS OR NEED HELP? SUBMIT THE SUPPORT REQUEST FORM or write email to SUPPORT@BYTESCOUT.COM
Repair Text in PDF | C#
Program.cs:
C#
using Bytescout.PDFExtractor; using System; namespace RepairText { class Program { static void Main(string[] args) { try { //Read all text from pdf file using (TextExtractor extractor = new TextExtractor()) { // Load PDF document extractor.LoadDocumentFromFile("sample.pdf"); // Set the font repairing OCR mode extractor.OCRMode = OCRMode.TextFromImagesAndVectorsAndRepairedFonts; // Set the location of OCR language data files extractor.OCRLanguageDataFolder = @"c:\Program Files\Bytescout PDF Extractor SDK\ocrdata_best\"; // Set OCR language extractor.OCRLanguage = "eng"; // "eng" for english, "deu" for German, "fra" for French, "spa" for Spanish etc - according to files in "ocrdata" folder // Find more language files at https://github.com/bytescout/ocrdata // Set PDF document rendering resolution extractor.OCRResolution = 300; //Read all text string allText = extractor.GetText(); Console.WriteLine("Extracted Text: \n\n" + allText); } } catch (Exception ex) { Console.WriteLine(ex.Message); } Console.ReadLine(); } } }