csharp: iTextSharp get Text or Image
using System;
using System.Collections.Generic;
using System.Linq;
using System.Web;
using System.Web.UI;
using System.Web.UI.WebControls;
using System.Drawing;
using System.Drawing.Imaging;
using System.IO;
using System.Text;
using iTextSharp.text.pdf;
using iTextSharp;
using iTextSharp.text.pdf.parser;
using Dotnet = System.Drawing.Image;

namespace OfficeDoumentWebApp
{
    /// <summary>
    /// WebForms page that reads a PDF with iTextSharp, writes the text of every
    /// page to the HTTP response and saves the image XObjects it finds to disk.
    /// Author: Geovin Du (geovindu, Tu Juwen).
    /// </summary>
    public partial class ItexPDFForm : System.Web.UI.Page
    {
        /// <summary>
        /// Prefix prepended to every image file name written by <see cref="RenderImage"/>.
        /// Page_Load replaces the placeholder with the mapped per-request output folder.
        /// </summary>
        string imgPath = "geovindu";

        /// <summary>
        /// On the first (non-postback) request: creates a timestamped folder under
        /// "OutFile/", extracts the text and images of every page of the source PDF,
        /// then writes the collected text to the response.
        /// </summary>
        /// <param name="sender">Event source (unused).</param>
        /// <param name="e">Event data (unused).</param>
        protected void Page_Load(object sender, EventArgs e)
        {
            StringBuilder sb = new StringBuilder();
            try
            {
                if (!IsPostBack)
                {
                    // One output folder per request, named after the current timestamp.
                    string datafile = DateTime.Now.ToString("yyyyMMddHHmmssfff");
                    string urc = Server.MapPath("OutFile/" + datafile + "/");
                    if (!Directory.Exists(urc))
                    {
                        Directory.CreateDirectory(urc);
                    }
                    imgPath = urc;

                    string sourcefile = Server.MapPath("SourceFile/珠宝RFID实施方案.pdf");
                    PdfReader pdfReader = new PdfReader(sourcefile);
                    try
                    {
                        for (int pageNumber = 1; pageNumber <= pdfReader.NumberOfPages; pageNumber++)
                        {
                            // Text content of the page.
                            sb.Append(PdfTextExtractor.GetTextFromPage(pdfReader, pageNumber));

                            // Image XObjects referenced by the page.
                            ExtractPageImages(pdfReader, pageNumber);
                        }
                    }
                    finally
                    {
                        // Release the source file even when a page fails to parse.
                        pdfReader.Close();
                    }
                }
            }
            catch (Exception ex)
            {
                // Best-effort page: report the failure instead of crashing the request.
                // Encoded because the message is emitted into an HTML response.
                Response.Write(Server.HtmlEncode(ex.Message));
            }

            // Extracted PDF text may contain '<' or '&'; encode it for HTML output.
            Response.Write(Server.HtmlEncode(sb.ToString()));
        }

        /// <summary>
        /// Walks the /XObject entries of one page's resource dictionary and hands
        /// every indirectly referenced image XObject to <see cref="RenderImage"/>.
        /// Pages without resources or without XObjects are skipped.
        /// </summary>
        /// <param name="pdfReader">Open reader for the source document.</param>
        /// <param name="pageNumber">1-based page number.</param>
        private void ExtractPageImages(PdfReader pdfReader, int pageNumber)
        {
            PdfDictionary page = pdfReader.GetPageN(pageNumber);
            if (page == null)
            {
                return;
            }

            PdfDictionary resources = PdfReader.GetPdfObject(page.Get(PdfName.RESOURCES)) as PdfDictionary;
            if (resources == null)
            {
                return;
            }

            PdfDictionary xobjects = PdfReader.GetPdfObject(resources.Get(PdfName.XOBJECT)) as PdfDictionary;
            if (xobjects == null)
            {
                return;
            }

            foreach (PdfName name in xobjects.Keys)
            {
                PdfObject obj = xobjects.Get(name);
                if (obj == null || !obj.IsIndirect())
                {
                    continue;
                }

                PdfDictionary xobject = PdfReader.GetPdfObject(obj) as PdfDictionary;

                // Only /Subtype /Image entries are images; form XObjects and the like
                // have no image data and must not be passed to the image decoder.
                if (xobject == null || !PdfName.IMAGE.Equals(xobject.GetAsName(PdfName.SUBTYPE)))
                {
                    continue;
                }

                GraphicsState state = new GraphicsState();
                ImageRenderInfo imgRI = ImageRenderInfo.CreateForXObject(state, (PRIndirectReference)obj, xobject);
                if (imgRI != null)
                {
                    RenderImage(imgRI, pageNumber);
                }
            }
        }

        /// <summary>
        /// Reads the non-public "gs" instance field of a
        /// <see cref="PathPaintingRenderInfo"/> through reflection.
        /// </summary>
        /// <param name="renderInfo">Render info to read the field from.</param>
        /// <returns>The value of the "gs" field cast to <see cref="GraphicsState"/>.</returns>
        /// <exception cref="InvalidOperationException">
        /// The iTextSharp build in use has no non-public instance field named "gs".
        /// </exception>
        GraphicsState getGraphicsState(PathPaintingRenderInfo renderInfo)
        {
            System.Reflection.FieldInfo gsField = typeof(PathPaintingRenderInfo).GetField(
                "gs",
                System.Reflection.BindingFlags.NonPublic | System.Reflection.BindingFlags.Instance);
            if (gsField == null)
            {
                throw new InvalidOperationException("PathPaintingRenderInfo has no non-public instance field named 'gs'.");
            }

            return (GraphicsState)gsField.GetValue(renderInfo);
        }

        /// <summary>
        /// Decodes the image behind <paramref name="renderInfo"/> and saves it as a
        /// JPEG file whose name starts with <c>imgPath</c> followed by the page number.
        /// Images that cannot be decoded to a drawing image are skipped.
        /// </summary>
        /// <param name="renderInfo">Render info describing the image XObject.</param>
        /// <param name="number">Page number used in the output file name.</param>
        private void RenderImage(ImageRenderInfo renderInfo, int number)
        {
            PdfImageObject image = renderInfo.GetImage();
            if (image == null)
            {
                return;
            }

            using (Dotnet dotnetImg = image.GetDrawingImage())
            {
                if (dotnetImg == null)
                {
                    return;
                }

                // Copy into a fresh Bitmap before encoding, as the original code did.
                using (Bitmap bitmap = new Bitmap(dotnetImg))
                {
                    // Pass the encoder explicitly: Save(path) alone does not pick the
                    // format from the ".jpg" extension.
                    bitmap.Save(NextImagePath(number), ImageFormat.Jpeg);
                }
            }
        }

        /// <summary>
        /// Returns a file path for the next image of a page that does not exist yet:
        /// "{imgPath}{number}.jpg" for the first image, then "{imgPath}{number}_2.jpg",
        /// "{imgPath}{number}_3.jpg", ... so several images on one page do not
        /// overwrite each other.
        /// </summary>
        /// <param name="number">Page number used in the file name.</param>
        /// <returns>A path for which <see cref="File.Exists"/> is currently false.</returns>
        private string NextImagePath(int number)
        {
            string path = imgPath + number + ".jpg";
            for (int suffix = 2; File.Exists(path); suffix++)
            {
                path = imgPath + number + "_" + suffix + ".jpg";
            }

            return path;
        }
    }
}
ABCpdf.NET
https://www.nuget.org/packages/ABCpdf
http://test.websupergoo.com/helppdfnet/default.htm?page=source%2f3-concepts%2fg-htmlrender.htm
哲学管理(学)人生, 文学艺术生活, 自动(计算机学)物理(学)工作, 生物(学)化学逆境, 历史(学)测绘(学)时间, 经济(学)数学金钱(理财), 心理(学)医学情绪, 诗词美容情感, 美学建筑(学)家园, 解构建构(分析)整合学习, 智商情商(IQ、EQ)运筹(学)生存.---Geovin Du(涂聚文)
【推荐】国内首个AI IDE,深度理解中文开发场景,立即下载体验Trae
【推荐】编程新体验,更懂你的AI,立即体验豆包MarsCode编程助手
【推荐】抖音旗下AI助手豆包,你的智能百科全书,全免费不限次数
【推荐】轻量又高性能的 SSH 工具 IShell:AI 加持,快人一步
· 25岁的心里话
· 闲置电脑爆改个人服务器(超详细) #公网映射 #Vmware虚拟网络编辑器
· 基于 Docker 搭建 FRP 内网穿透开源项目(很简单哒)
· 零经验选手,Compose 一天开发一款小游戏!
· 一起来玩mcp_server_sqlite,让AI帮你做增删改查!!
2010-09-08 C# 添加用户自定义控件的两种方式