C#: Extracting text and images from a PDF with iTextSharp

 

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
using System;
using System.Collections.Generic;
using System.Linq;
using System.Web;
using System.Web.UI;
using System.Web.UI.WebControls;
using System.Drawing;
using System.Drawing.Imaging;
using System.IO;
using System.Text;
using iTextSharp.text.pdf;
using iTextSharp;
using iTextSharp.text.pdf.parser;
using Dotnet = System.Drawing.Image;
 
 
namespace OfficeDoumentWebApp
{
 
 
    /// <summary>
    /// geovindu,Geovin Du, 涂聚文
    /// pdf
    /// </summary>
    public partial class ItexPDFForm : System.Web.UI.Page
    {
        string imgPath="geovindu";
        /// <summary>
        ///
        /// </summary>
        /// <param name="sender"></param>
        /// <param name="e"></param>
        protected void Page_Load(object sender, EventArgs e)
        {
            StringBuilder sb = new StringBuilder();          
            try
            {
 
                if(!IsPostBack)
                {
                    //Server.MapPath
                    string datafile = DateTime.Now.ToString("yyyyMMddHHmmssfff");
                    string urc = Server.MapPath("OutFile/" + datafile + "/");
                    if (!Directory.Exists(urc))
                    {
                        Directory.CreateDirectory(urc);
                    }
 
                    imgPath = urc;
                        string sourcefile = Server.MapPath("SourceFile/珠宝RFID实施方案.pdf");  //珠宝RFID实施方案
                        //if (!Directory.Exists(urc))
                        // Directory.CreateDirectory(urc);
                   
                      //  ItexPDFParser.ExtractImagesFromPDF(Server.MapPath("SourceFile/珠宝RFID实施方案.pdf"), urc);
 
                        PdfReader pdfReader = new PdfReader(sourcefile);
                    PdfReaderContentParser parser = new PdfReaderContentParser(pdfReader);
                    //ExtRenderListener extRenderListener = new ExtRenderListener();
 
                    for (int pageNumber = 1; pageNumber <= pdfReader.NumberOfPages; pageNumber++)
                    {
 
                        //PdfReader pdf = new PdfReader(pdfFile);
                        PdfDictionary pg = pdfReader.GetPageN(pageNumber);
                        PdfDictionary res = (PdfDictionary)PdfReader.GetPdfObject(pg.Get(PdfName.RESOURCES));
                        PdfDictionary xobj = (PdfDictionary)PdfReader.GetPdfObject(res.Get(PdfName.XOBJECT));
 
                        //获取文本内容
                      string tex= PdfTextExtractor.GetTextFromPage(pdfReader, pageNumber);
                        sb.Append(tex);
 
                        if (!object.Equals(xobj, null))
                        {
                            foreach (PdfName name in xobj.Keys)
                            {
                                PdfObject obj = xobj.Get(name);
                                if (obj.IsIndirect())
                                {
                                    PdfDictionary tg = (PdfDictionary)PdfReader.GetPdfObject(obj);
                                    string width = tg.Get(PdfName.WIDTH).ToString();
                                    string height = tg.Get(PdfName.HEIGHT).ToString();
                                    //TextRenderInfo inf=pdfReader.
                                    GraphicsState state = new GraphicsState();
                                    // state=
                                    //state = (GraphicsState)(new Matrix(float.Parse(width), float.Parse(height)));
                                    ImageRenderInfo imgRI = ImageRenderInfo.CreateForXObject(state, (PRIndirectReference)obj, tg);
                                    if (!Object.Equals(imgRI, null))
                                    {
                                        RenderImage(imgRI, pageNumber); //图片没有读出
                                    }
 
 
                                }
                            }
                        }
                    }
                    
 
 
 
                 }
 
            }
            catch(Exception ex)
            {
                Response.Write(ex.Message.ToString());
 
            }
            Response.Write(sb.ToString());
        }
        /// <summary>
        ///
        /// </summary>
        /// <param name="renderInfo"></param>
        /// <returns></returns>
        GraphicsState getGraphicsState(PathPaintingRenderInfo renderInfo)
        {
            System.Reflection.FieldInfo gsField = typeof(PathPaintingRenderInfo).GetField("gs", System.Reflection.BindingFlags.NonPublic | System.Reflection.BindingFlags.Instance);
            return (GraphicsState)gsField.GetValue(renderInfo);
        }
 
 
        /// <summary>
        /// 提取图片
        /// geovindu,Geovin Du
        /// 涂聚文
        /// </summary>
        /// <param name="renderInfo"></param>
 
        private void RenderImage(ImageRenderInfo renderInfo,int number)
        {
            PdfImageObject image = renderInfo.GetImage();
            using (Dotnet dotnetImg = image.GetDrawingImage())
            {
                if (dotnetImg != null)
                {
                    using (MemoryStream ms = new MemoryStream())
                    {
                        dotnetImg.Save(ms, ImageFormat.Jpeg); //Tiff
                        Bitmap d = new Bitmap(dotnetImg);
                        string f = imgPath + number + ".jpg";
                        d.Save(imgPath+number+".jpg");
                    }
                }
            }
        }
 
 
    }
}

  

 

 

ABCpdf.NET
https://www.nuget.org/packages/ABCpdf
http://test.websupergoo.com/helppdfnet/default.htm?page=source%2f3-concepts%2fg-htmlrender.htm

posted @   ®Geovin Du Dream Park™  阅读(71)  评论(0)  编辑  收藏  举报
相关博文:
阅读排行:
· 25岁的心里话
· 闲置电脑爆改个人服务器(超详细) #公网映射 #Vmware虚拟网络编辑器
· 基于 Docker 搭建 FRP 内网穿透开源项目(很简单哒)
· 零经验选手,Compose 一天开发一款小游戏!
· 一起来玩mcp_server_sqlite,让AI帮你做增删改查!!
历史上的今天:
2010-09-08 C# 添加用户自定义控件的两种方式
< 2025年3月 >
23 24 25 26 27 28 1
2 3 4 5 6 7 8
9 10 11 12 13 14 15
16 17 18 19 20 21 22
23 24 25 26 27 28 29
30 31 1 2 3 4 5
点击右上角即可分享
微信分享提示