iText 7 使用及 Spire.OCR 使用
iText 7 使用
// Opens the PDF at urlBJ and feeds each page's content through a
// PdfCanvasProcessor whose events go to an ImageRenderListener built with
// imageFileName.
// NOTE(review): presumably the listener writes the rendered image to
// imageFileName - confirm against ImageRenderListener.
using (PdfReader reader = new PdfReader(urlBJ))
using (PdfDocument pdfDocument = new PdfDocument(reader))
{
    IEventListener listener = new ImageRenderListener(imageFileName);
    PdfCanvasProcessor processor = new PdfCanvasProcessor(listener);

    // Pages are visited from 1 through GetNumberOfPages() inclusive.
    for (var i = 1; i <= pdfDocument.GetNumberOfPages(); i++)
    {
        try
        {
            // Remove any file left at imageFileName before this page is processed.
            if (File.Exists(imageFileName))
            {
                File.Delete(imageFileName);
            }

            var page = pdfDocument.GetPage(i);
            processor.ProcessPageContent(page);

            // NOTE(review): `image` is not declared in this snippet; it looks like
            // the per-page OCR code that loads it is meant to sit right above
            // this line - confirm.
            image.Dispose();
        }
        catch (Exception ex)
        {
            // A failing page is reported to the user and the loop moves on.
            MessageBox.Show(ex.Message);
        }
    }
}
Spire.OCR使用
// Runs Spire.OCR over the image stored at imageFileName and, when the recognized
// text contains "图纸名称", appends the current page index i followed by a comma
// to UrlPage.
// NOTE(review): i, imageFileName and UrlPage are not declared in this snippet;
// it appears to be meant for the body of a per-page loop - confirm.
Image image = Image.FromFile(imageFileName);
try
{
    // Re-encode the picture as JPEG into memory; the scanner is given that stream.
    using (Bitmap bmp = new Bitmap(image))
    using (MemoryStream memoryStream = new MemoryStream())
    {
        bmp.Save(memoryStream, System.Drawing.Imaging.ImageFormat.Jpeg);

        OcrScanner ocrScanner = new OcrScanner();
        // Started here as in the original snippet; nothing visible reads it.
        System.Diagnostics.Stopwatch stopwatch = System.Diagnostics.Stopwatch.StartNew();

        // Map the System.Drawing format name ("Jpeg") onto the OCR library's enum.
        // Fail loudly instead of silently scanning with the enum's default value.
        OCRImageFormat imageFormat;
        if (!Enum.TryParse(System.Drawing.Imaging.ImageFormat.Jpeg.ToString(), true, out imageFormat))
        {
            throw new InvalidOperationException("OCRImageFormat has no member matching the JPEG image format.");
        }

        bool result = ocrScanner.Scan(memoryStream, imageFormat);
        if (result)
        {
            // Read the recognized text once and reuse it for the keyword check.
            string name = ocrScanner.Text.ToString();
            if (name.Contains("图纸名称"))
            {
                // Appending to a null or empty UrlPage yields just "<i>,", so the
                // original empty/non-empty branches collapse into one statement.
                UrlPage += i.ToString() + ",";
            }
        }
    }
}
finally
{
    // Always release the handle held on imageFileName, even when the scan throws,
    // so the file can be deleted or overwritten afterwards.
    image.Dispose();
}

浙公网安备 33010602011771号