11,570 questions
If you want to extract text from a PDF, you can use iText 7.
A basic sample:
// Print the text of every page of the PDF to the console.
// The using blocks close the document and the reader even when extraction
// throws part-way through, so the underlying file handle is never leaked.
using (PdfReader pdfReader = new PdfReader("e:\\test.pdf"))
using (PdfDocument pdfDoc = new PdfDocument(pdfReader))
{
    // The page count does not change while reading, so query it once.
    int pageCount = pdfDoc.GetNumberOfPages();

    // Pages are addressed starting at 1.
    for (int nPage = 1; nPage <= pageCount; nPage++)
    {
        // A new strategy instance is created for each page, as in the original sample.
        iText.Kernel.Pdf.Canvas.Parser.Listener.ITextExtractionStrategy extractionStrategy =
            new iText.Kernel.Pdf.Canvas.Parser.Listener.SimpleTextExtractionStrategy();
        string sPageText = iText.Kernel.Pdf.Canvas.Parser.PdfTextExtractor.GetTextFromPage(
            pdfDoc.GetPage(nPage), extractionStrategy);

        Console.WriteLine("Page : {0}", nPage);
        Console.WriteLine(sPageText);
    }
}