This is the code I wrote. Sorry, I am truly a newbie at coding. I want to find the numbers of the pages in the PDF file on which the word "Revenue" appears, and then print them out on the CMD. Could anyone help me? Thanks a lot.
using System;
using System.Collections.Generic;
using System.Linq;
using System.Text;
using System.Threading.Tasks;
using iTextSharp.text.pdf;
using iTextSharp.text.pdf.parser;
namespace pdf26052021
{
/// <summary>
/// Console entry point: searches a fixed PDF file for the word "Revenue"
/// and prints the numbers of the pages on which it appears.
/// </summary>
class Program
{
    /// <summary>
    /// Runs the search, writes the matching page numbers to the console and
    /// waits for the user to press Enter before exiting.
    /// </summary>
    /// <param name="args">Command-line arguments (not used).</param>
    static void Main(string[] args)
    {
        PFD pdf = new PFD();
        List<int> pages = pdf.ReadPdfFile(@"C:\Users\fengs\Desktop\pdf", "test.pdf", "Revenue");

        if (pages.Count == 0)
        {
            Console.WriteLine("No matching pages found.");
        }
        else
        {
            // Console.WriteLine(list) would only print the list's type name,
            // so the page numbers are joined into one readable line instead.
            Console.WriteLine(string.Join(", ", pages));
        }

        // Keep the console window open until the user presses Enter.
        Console.ReadLine();
    }
}
/// <summary>
/// Helper for locating text inside PDF documents using iTextSharp.
/// </summary>
class PFD
{
    /// <summary>
    /// Finds the pages of a PDF file whose extracted text contains the given
    /// search text.
    /// </summary>
    /// <param name="path">Directory that contains the PDF file.</param>
    /// <param name="fileName">Name of the PDF file inside <paramref name="path"/>.</param>
    /// <param name="searthText">Text to look for; the comparison is case-sensitive.</param>
    /// <returns>
    /// The 1-based numbers of the pages that contain the text, in ascending
    /// order. The list is empty when the file does not exist, when either
    /// <paramref name="path"/> or <paramref name="fileName"/> is null, or
    /// when no page matches.
    /// </returns>
    public List<int> ReadPdfFile(string path, string fileName, String searthText)
    {
        List<int> pages = new List<int>();

        // No usable location means there is nothing to search.
        if (path == null || fileName == null)
        {
            return pages;
        }

        // Build the full path once; Path.Combine takes care of the separator.
        string fullPath = System.IO.Path.Combine(path, fileName);
        if (!System.IO.File.Exists(fullPath))
        {
            return pages;
        }

        PdfReader pdfReader = new PdfReader(fullPath);
        try
        {
            for (int page = 1; page <= pdfReader.NumberOfPages; page++)
            {
                // A new strategy instance is created for every page.
                ITextExtractionStrategy strategy = new SimpleTextExtractionStrategy();
                string currentPageText = PdfTextExtractor.GetTextFromPage(pdfReader, page, strategy);
                if (currentPageText.Contains(searthText))
                {
                    pages.Add(page);
                }
            }
        }
        finally
        {
            // Release the file even when text extraction throws.
            pdfReader.Close();
        }

        return pages;
    }
}
}
Thank you.