OCR
安装 Microsoft Office Document Imaging(MODI)之后,在项目中添加对 Microsoft Office Document Imaging 11 Type Library 的引用,并将对应的控件添加到工具箱;这样即可使用 MODI 命名空间下的 Document、Image 等主要文档操作类,以及用于显示文档的 AxMODI.AxMiDocView 控件。关键代码如下:
/// <summary>
/// Creates a new MODI document from the given file and shows it in the
/// document viewer control.
/// </summary>
/// <param name="filename">Path of the image file passed to <c>MODI.Document.Create</c>.</param>
/// <remarks>
/// A <see cref="System.Runtime.InteropServices.COMException"/> raised while
/// creating or displaying the document is reported in a message box and not
/// rethrown.
/// </remarks>
private void SetImage(string filename)
{
    // set the image..
    try
    {
        _MODIDocument = new MODI.Document();
        _MODIDocument.Create(filename);

        // Hand the document to the viewer and repaint it.
        axMiDocView1.Document = _MODIDocument;
        axMiDocView1.Refresh();
    }
    catch (System.Runtime.InteropServices.COMException ee)
    {
        MessageBox.Show(ee.Message);
    }
}
/// <summary>
/// Runs OCR on the currently loaded MODI document and writes the recognised
/// text of its first image into <c>textBox1</c>.
/// </summary>
/// <remarks>
/// Does nothing when no document is loaded. After a successful run the
/// document is closed and the field is reset to <c>null</c>. Any exception is
/// reported in a message box and not rethrown; in that case the document is
/// left as it was.
/// </remarks>
public void Analyse()
{
    if (_MODIDocument == null)
    {
        return;
    }

    try
    {
        // Optional: add an event handler for progress visualisation.
        //_MODIDocument.OnOCRProgress += new MODI._IDocumentEvents_OnOCRProgressEventHandler(this.ShowProgress);

        // The MODI call for OCR. Alternative driven by configurable parameters:
        //_MODIDocument.OCR(_MODIParameters.Language, _MODIParameters.WithAutoRotation, _MODIParameters.WithStraightenImage);
        // Here: Simplified Chinese, with auto-rotation and image straightening enabled.
        _MODIDocument.OCR(MODI.MiLANGUAGES.miLANG_CHINESE_SIMPLIFIED, true, true);

        // Direct cast so that an unexpected type surfaces as an InvalidCastException
        // instead of a NullReferenceException from a failed 'as' cast.
        MODI.Image firstImage = (MODI.Image)_MODIDocument.Images[0];
        this.textBox1.Text = firstImage.Layout.Text;
        //statusBar1.Text = "Ready.";

        // false = do not save changes (per the MODI Document.Close documentation).
        _MODIDocument.Close(false);
        _MODIDocument = null;
    }
    catch (Exception ee)
    {
        // simple exception "handling"
        MessageBox.Show(ee.Message);
    }
}