转:C# PDFBox 读取 PDF 内容

using System;
using System.Windows.Forms;
using org.apache.pdfbox.pdmodel;
using org.apache.pdfbox.util;
using System.IO;
 
 
namespace ReadPDF
{
    /// <summary>
    /// Form whose button click handler runs PDFBox text extraction on a PDF file.
    /// </summary>
    public partial class Form2 : Form
    {
        /// <summary>
        /// Creates the form and calls <c>InitializeComponent</c>, which is defined
        /// in another part of this partial class.
        /// </summary>
        public Form2()
        {
            InitializeComponent();
        }

        /// <summary>
        /// Loads the PDF at <c>pdffile.FullName</c> with PDFBox and extracts its
        /// text using a <c>PDFTextStripper</c>. The document is always closed
        /// afterwards, even when extraction throws.
        /// </summary>
        /// <param name="pdffile">The PDF file to read; must not be null.</param>
        /// <exception cref="ArgumentNullException">
        /// Thrown when <paramref name="pdffile"/> is null.
        /// </exception>
        public static void pdf2txt(FileInfo pdffile)
        {
            if (pdffile == null)
            {
                throw new ArgumentNullException("pdffile");
            }

            PDDocument doc = PDDocument.load(pdffile.FullName);
            try
            {
                PDFTextStripper pdfStripper = new PDFTextStripper();

                // NOTE(review): the extracted text is not returned, stored or
                // written anywhere, so callers cannot observe it. The void
                // signature is kept for compatibility; decide where it should go.
                string text = pdfStripper.getText(doc);
            }
            finally
            {
                // Release the resources held by the loaded document; without
                // this every call leaks the open PDF.
                doc.close();
            }
        }

        /// <summary>
        /// Click handler for <c>button1</c>: runs <see cref="pdf2txt"/> on a
        /// fixed file path.
        /// </summary>
        /// <param name="sender">The event source (unused).</param>
        /// <param name="e">The event data (unused).</param>
        private void button1_Click(object sender, EventArgs e)
        {
            // NOTE(review): the input path is hard-coded.
            pdf2txt(new FileInfo(@"e:/5.pdf"));
        }
    }
}

 

 

原文:https://blog.csdn.net/wk125570/article/details/75099051?utm_source=copy

posted @ 2018-10-12 09:22  chu_叶子  阅读(2604)  评论(0)  编辑  收藏  举报