最近在做一个项目要求word 中的图片与文字分离 ,找了好久终于找到一个完美的方法

 

c#实现word中的图文分离

 

part 1: class define

 

publicclass WordSeparator:IDisposable
{
#region Constructor
public WordSeparator()
{
WordApp
=new Microsoft.Office.Interop.Word.Application();
}
#endregion

#region Fields
private Microsoft.Office.Interop.Word.Application WordApp;
privateobject missing = System.Reflection.Missing.Value;
privateobject yes =true;
privateobject no =false;
private Microsoft.Office.Interop.Word.Document d;
privateobject filename =@"C:\example.rtf";
#endregion

#region Methods
publicvoid UpdateDoc()
{
d
= WordApp.Documents.Open(ref filename, ref missing, ref no, ref missing,
ref missing, ref missing, ref missing, ref missing, ref missing,
ref missing, ref missing, ref yes, ref missing, ref missing, ref missing, ref missing);
List
<Microsoft.Office.Interop.Word.Range> ranges =
new List<Microsoft.Office.Interop.Word.Range>();
foreach (Microsoft.Office.Interop.Word.InlineShape s in d.InlineShapes)
{
if (s.Type ==
Microsoft.Office.Interop.Word.WdInlineShapeType.wdInlineShapePicture)
{
ranges.Add(s.Range);
s.Delete();
}
}
foreach (Microsoft.Office.Interop.Word.Range r in ranges)
{
r.InlineShapes.AddPicture(
@"c:\PathToNewImage\Image.jpg", ref missing, ref missing, ref missing);
}
WordApp.Quit(
ref yes, ref missing, ref missing);
}
publicvoid SeparateImageText()
{
//初始化程序
d = WordApp.Documents.Open(ref filename, ref missing, ref no, ref missing,
ref missing, ref missing, ref missing, ref missing, ref missing,
ref missing, ref missing, ref yes, ref missing, ref missing, ref missing, ref missing);
List
<Microsoft.Office.Interop.Word.Range> ranges =
new List<Microsoft.Office.Interop.Word.Range>();
List
<string> files =new List<string>();
foreach (Microsoft.Office.Interop.Word.InlineShape s in d.InlineShapes)
{
if (s.Type == Microsoft.Office.Interop.Word.WdInlineShapeType.wdInlineShapePicture
|| s.Type ==
Microsoft.Office.Interop.Word.WdInlineShapeType.wdInlineShapeEmbeddedOLEObject)
{
//获取图片数据
byte[] imgData = (byte[])s.Range.EnhMetaFileBits;
string file =string.Concat(Guid.NewGuid().ToString(), ".gif");
files.Add(file);
//构造图形
MemoryStream mStream =new MemoryStream(imgData);
Bitmap bmp
=new Bitmap(mStream);
//保存到磁盘
bmp.Save(file);
mStream.Dispose();
bmp.Dispose();

ranges.Add(s.Range);
s.Delete();
}
}
for (int i =0; i < ranges.Count; i ++ )
{
Microsoft.Office.Interop.Word.Range r
= ranges[i];
//替换图片
r.InsertBefore("<img src='"+ files[i] +"'>");
r.InsertAfter(
"</img>");
}
//退出程序
WordApp.Quit(ref yes, ref missing, ref missing);
}
///<summary>
/// 替换word中的图片
///</summary>
///<param name="serverPath">图片文件的存储物理路径</param>
///<param name="virtualPath">图片文件的标签虚拟路径</param>
publicvoid SeparateImageText(string serverPath, string virtualPath)
{
//初始化程序
d = WordApp.Documents.Open(ref filename, ref missing, ref no, ref missing,
ref missing, ref missing, ref missing, ref missing, ref missing,
ref missing, ref missing, ref yes, ref missing, ref missing, ref missing, ref missing);
List
<Microsoft.Office.Interop.Word.Range> ranges =new List<Microsoft.Office.Interop.Word.Range>();
List
<string> files =new List<string>();
foreach (Microsoft.Office.Interop.Word.InlineShape s in d.InlineShapes)
{
if (s.Type == Microsoft.Office.Interop.Word.WdInlineShapeType.wdInlineShapePicture
|| s.Type == Microsoft.Office.Interop.Word.WdInlineShapeType.wdInlineShapeEmbeddedOLEObject)
{
//获取图片数据
byte[] imgData = (byte[])s.Range.EnhMetaFileBits;
string file =string.Concat(Guid.NewGuid().ToString(), ".gif");
files.Add(file);
//构造图形
MemoryStream mStream =new MemoryStream(imgData);
Bitmap bmp
=new Bitmap(mStream);
//保存到磁盘
bmp.Save(string.Concat(serverPath, "\\", file));
mStream.Dispose();
bmp.Dispose();

ranges.Add(s.Range);
s.Delete();
}
}
for (int i =0; i < ranges.Count; i++)
{
Microsoft.Office.Interop.Word.Range r
= ranges[i];
//替换图片
r.InsertBefore("<img src='"+string.Concat(virtualPath,"//",files[i]) +"'>");
r.InsertAfter(
"</img>");
}
//退出程序
WordApp.Quit(ref yes, ref missing, ref missing);
}
///<summary>
/// 替换word中的图片
///</summary>
///<param name="targetFile">目标文件</param>
///<param name="serverPath">图片文件的存储物理路径</param>
///<param name="virtualPath">图片文件的标签虚拟路径</param>
publicvoid SeparateImageText(string targetFile,string serverPath, string virtualPath)
{
filename
= targetFile;
//初始化程序
d = WordApp.Documents.Open(ref filename, ref missing, ref no, ref missing,
ref missing, ref missing, ref missing, ref missing, ref missing,
ref missing, ref missing, ref yes, ref missing, ref missing, ref missing, ref missing);
List
<Microsoft.Office.Interop.Word.Range> ranges =new List<Microsoft.Office.Interop.Word.Range>();
List
<string> files =new List<string>();
foreach (Microsoft.Office.Interop.Word.InlineShape s in d.InlineShapes)
{
if (s.Type == Microsoft.Office.Interop.Word.WdInlineShapeType.wdInlineShapePicture
|| s.Type == Microsoft.Office.Interop.Word.WdInlineShapeType.wdInlineShapeEmbeddedOLEObject)
{
//获取图片数据
byte[] imgData = (byte[])s.Range.EnhMetaFileBits;
string file =string.Concat(Guid.NewGuid().ToString(), ".gif");
files.Add(file);
//构造图形
MemoryStream mStream =new MemoryStream(imgData);
Bitmap bmp
=new Bitmap(mStream);
//保存到磁盘
bmp.Save(string.Concat(serverPath, "\\", file));
mStream.Dispose();
bmp.Dispose();

ranges.Add(s.Range);
s.Delete();
}
}
for (int i =0; i < ranges.Count; i++)
{
Microsoft.Office.Interop.Word.Range r
= ranges[i];
//替换图片
r.InsertBefore("<img src='"+string.Concat(virtualPath, "//", files[i]) +"'>");
r.InsertAfter(
"</img>");
}
//退出程序
WordApp.Quit(ref yes, ref missing, ref missing);
}
#endregion

#region IDisposable 成员

publicvoid Dispose()
{
if (d !=null)
{
System.Runtime.InteropServices.Marshal.ReleaseComObject(d);
d
=null;
}
if (WordApp !=null)
{
System.Runtime.InteropServices.Marshal.ReleaseComObject(WordApp);
WordApp
=null;
}
}

#endregion
}

 part 2: usage code:

 

WordSeparator w =new WordSeparator();
w.SeparateImageText();
 
 
 
Shape 对象代表文档中的图形对象,
InlineShape 代表文档中的嵌入式图形对象,
但是我又遇到了另外一种问题,word 中的图片除了InlineShape  的图片外还有  Shape 
 如果将 Shape  转化为  InlineShape  就会报错
 对于shape 还是没法做到完全分离,希望大神指点一二
 
posted @ 2014-11-05 17:14 zhao69222 阅读(571) 评论(0) 推荐(0) 编辑
摘要: 开始-->运行 regedit 进入注册表补充些: 1. gpedit.msc-----组策略 2. sndrec32-------录音机 3. Nslookup-------IP地址侦测器 4. explorer-------打开资源管理器 5. logoff---------注销命令 6. tsshutdn-------60秒倒计时关机命令7. lusrmgr.msc----本机用户和组 8. services.msc---本地服务设置 9. oobe/msoobe /a----检查XP是否激活 10. notepad--------打开记事本 11. cleanmgr--... 阅读全文
posted @ 2013-09-03 21:42 zhao69222 阅读(375) 评论(0) 推荐(0) 编辑
摘要: //获取程序的基目录。 System.AppDomain.CurrentDomain.BaseDirectory//获取模块的完整路径。 System.Diagnostics.Process.GetCurrentProcess().MainModule.FileName//获取和设置当前目录(该进程... 阅读全文
posted @ 2013-06-03 17:15 zhao69222 阅读(163) 评论(0) 推荐(0) 编辑
摘要: 64为操作系统,64位IIS,运行32位应用程序的问题1).32位模式若想要在32位IIS下运行程序,即运行在.netframwork32位下进行如下配置:(1)cscript%systemdrive%\inetpub\adminscripts\adsutil.vbssetw3svc/appPools/enable32bitapponwin641修改IIS配置,允许32位程序运行这个是在C:\Inetpub\AdminScripts\\adsutil.vbs(2)C:\WINDOWS\Microsoft.NET\Framework\v2.0.50727\aspnet_regiis-i为IIS注 阅读全文
posted @ 2012-12-19 15:28 zhao69222 阅读(1176) 评论(4) 推荐(0) 编辑
摘要: IE下设置网页为 首页,收藏 阅读全文
posted @ 2012-11-05 10:33 zhao69222 阅读(196) 评论(0) 推荐(0) 编辑
点击右上角即可分享
微信分享提示