Chinese Simplified (简体中文)

English (English)

字段级识别

Note: Some parts of this article may be in English. We apologize for the inconvenience and are working on adding the translation as soon as possible.

进行字段级识别时，会识别短文本片段以捕捉某些字段的数据。识别质量在此场景中至关重要。

此场景也可用作更复杂场景的组成部分，这些场景需要从文档中提取有意义的数据（例如，为了将数据从纸质文档捕获到信息系统和数据库中，或者为了在文档管理系统中自动进行文档分类和索引）。

在此场景中，系统要么只识别部分字段中的几行文本，要么识别一个小图像上的整个文本。系统会计算出识别的每个字符的确定性评分。然后，在检查识别结果时可以使用确定性评分。此外，系统可以存储文本中词语和字符的多个识别变体，然后可在投票算法中使用它们改善识别质量。

此场景中的小文本片段处理在一些方面不同于其他场景中的相同步骤：

对扫描的图像或照片进行预处理

要识别的图像可能包含标记和背景噪声，两者都有可能妨碍识别。为此，会在这一步去除所有不需要的标记和背景噪声。

小文本片段识别

识别小文本片段时会事先知道要识别的数据类型。因此，可以通过使用外部字典、正则表达式、自定义识别语言和字母表，以及对字符串中的字符数量进行限制来改善识别质量。文本字段可能会同时包含印刷文本和手写文本。

处理已识别的数据

此场景要求达到最高的识别准确度，以便将数据校验工作保持在最低水平。系统可以计算出每个已识别的词语或字符的确定性评分并提供多个识别变体，然后多个引擎可以应用投票算法从中选择最佳候选对象。

场景实现

下面详细介绍了在此场景中使用 ABBYY FineReader Engine 12 的推荐方法。建议方法中采用了被认为最适合此场景的处理设置。

第1步加载 ABBYY FineReader Engine

要开始使用 ABBYY FineReader Engine，您需要创建 Engine 对象。Engine 对象是 ABBYY FineReader Engine 对象层次体系中的顶级对象，提供各种全局设置、一些处理方法和用于创建其它对象的方法。

要创建 Engine 对象，您可以使用导出函数 InitializeEngine。另请参阅加载 Engine 对象的不同方式。

C#

/// <summary>
/// Loads FREngine.dll manually and obtains the FineReader Engine object by
/// calling the library's exported InitializeEngine function.
/// </summary>
public class EngineLoader : IDisposable
{
    // Kernel32.dll functions
    private const uint LOAD_WITH_ALTERED_SEARCH_PATH = 0x00000008;
    [DllImport("kernel32.dll")]
    private static extern IntPtr LoadLibraryEx(string dllToLoad, IntPtr reserved, uint flags);
    [DllImport("kernel32.dll")]
    private static extern IntPtr GetProcAddress(IntPtr hModule, string procedureName);
    [DllImport("kernel32.dll")]
    private static extern bool FreeLibrary(IntPtr hModule);

    // FREngine.dll functions
    [UnmanagedFunctionPointer(CallingConvention.StdCall, CharSet = CharSet.Unicode)]
    private delegate int InitializeEngine(string customerProjectId, string licensePath,
        string licensePassword, string tempFolder, string dataFolder, bool isSharedCPUCoresMode,
        ref FREngine.IEngine engine);
    [UnmanagedFunctionPointer(CallingConvention.StdCall)]
    private delegate int DeinitializeEngine();
    [UnmanagedFunctionPointer(CallingConvention.StdCall)]
    private delegate int DllCanUnloadNow();

    // Private state
    private FREngine.IEngine engine = null;
    // Handle to FREngine.dll
    private IntPtr dllHandle = IntPtr.Zero;
    private InitializeEngine initializeEngine = null;
    private DeinitializeEngine deinitializeEngine = null;
    private DllCanUnloadNow dllCanUnloadNow = null;

    /// <summary>
    /// Loads the library, resolves its three exports and initializes the Engine.
    /// On any failure all fields are reset, FreeLibrary is called, and the
    /// original exception is rethrown.
    /// </summary>
    public EngineLoader()
    {
        // Fill these in with the full path to FREngine.dll, your Customer Project ID and,
        // if applicable, the path to your Online License token file and the Online License password
        string enginePath = "";
        string customerProjectId = "";
        string licensePath = "";
        string licensePassword = "";

        // Load the FREngine.dll library
        dllHandle = LoadLibraryEx(enginePath, IntPtr.Zero, LOAD_WITH_ALTERED_SEARCH_PATH);

        try
        {
            if (dllHandle == IntPtr.Zero)
            {
                throw new Exception("无法加载" + enginePath);
            }

            // Resolve the exported functions; each lookup throws when the export is missing
            IntPtr initPtr = GetRequiredExport("InitializeEngine", "无法找到 InitializeEngine 函数");
            IntPtr deinitPtr = GetRequiredExport("DeinitializeEngine", "无法找到 DeinitializeEngine 函数");
            IntPtr canUnloadPtr = GetRequiredExport("DllCanUnloadNow", "无法找到 DllCanUnloadNow 函数");

            // Convert the pointers to delegates
            initializeEngine = (InitializeEngine)Marshal.GetDelegateForFunctionPointer(
                initPtr, typeof(InitializeEngine));
            deinitializeEngine = (DeinitializeEngine)Marshal.GetDelegateForFunctionPointer(
                deinitPtr, typeof(DeinitializeEngine));
            dllCanUnloadNow = (DllCanUnloadNow)Marshal.GetDelegateForFunctionPointer(
                canUnloadPtr, typeof(DllCanUnloadNow));

            // Call InitializeEngine, passing the Online License file path
            // and the Online License password
            int initResult = initializeEngine(customerProjectId, licensePath, licensePassword,
                "", "", false, ref engine);
            Marshal.ThrowExceptionForHR(initResult);
        }
        catch (Exception)
        {
            // Release the FREngine.dll library
            engine = null;
            // Delete all objects before the FreeLibrary call
            GC.Collect();
            GC.WaitForPendingFinalizers();
            GC.Collect();
            FreeLibrary(dllHandle);
            dllHandle = IntPtr.Zero;
            initializeEngine = null;
            deinitializeEngine = null;
            dllCanUnloadNow = null;
            throw;
        }
    }

    // Returns the address of the named export of the loaded library,
    // or throws an Exception carrying notFoundMessage when GetProcAddress returns zero.
    private IntPtr GetRequiredExport(string exportName, string notFoundMessage)
    {
        IntPtr address = GetProcAddress(dllHandle, exportName);
        if (address == IntPtr.Zero)
        {
            throw new Exception(notFoundMessage);
        }
        return address;
    }
}

C++ (COM)

// Initialize these variables with the path to FREngine.dll, your FineReader Engine
// Customer Project ID and, if applicable, the path to the Online License token
// and the Online License password
wchar_t* FreDllPath;
wchar_t* CustomerProjectId;
wchar_t* LicensePath;  // assign empty strings to these variables if you do not use an Online License
wchar_t* LicensePassword;
// Handle to FREngine.dll
static HMODULE libraryHandle = 0;
// Global FineReader Engine object
FREngine::IEnginePtr Engine;
void LoadFREngine()
{
    if( Engine != 0 ) {
    // 已加载
    return;
    }
    // 第1步：加载 FREngine.dll
    if( libraryHandle == 0 ) {
        libraryHandle = LoadLibraryEx( FreDllPath, 0, LOAD_WITH_ALTERED_SEARCH_PATH );
        if( libraryHandle == 0 ) {
            throw L"加载 ABBYY FineReader Engine 是出错";
        }
    }
    // 第2步：获取 Engine 对象
    typedef HRESULT ( STDAPICALLTYPE* InitializeEngineFunc )( BSTR, BSTR, BSTR, BSTR, 
        BSTR, VARIANT_BOOL, FREngine::IEngine** );
    InitializeEngineFunc pInitializeEngine =
    ( InitializeEngineFunc )GetProcAddress( libraryHandle, "InitializeEngine");
    if( pInitializeEngine == 0 || pInitializeEngine( CustomerProjectId, LicensePath, 
        LicensePassword, L"", L"", VARIANT_FALSE, &Engine ) != S_OK ) {
    UnloadFREngine();
    throw L"加载 ABBYY FineReader Engine 时出错";
    }
}

第2步加载方案设置

第3步加载和预处理图像

第4步设置要识别的字段

现在需要创建包含您的字段的块，并指定每个块的类型和内部数据的已知特征。

使用 Analyze 方法执行文档布局分析，或者手动添加包含需要识别的字段的块。请参阅处理布局和块以了解相关说明。

现在，可以为每个字段指定其自身的识别参数。例如，如果某个字段包含一些文本，则使用 ITextBlock::RecognizerParams 属性：

通过 RecognizerParams 对象的 TextTypes 属性设置文本类型。例如，如果字段包含用邮政编码样式写下的数字，则使用 TT_Index 文本类型。
通过 SetPredefinedTextLanguage 方法设置语言。如果您知道字段中包含的信息类型，则使用特殊的预定义语言可能会很有帮助。例如，如果字段包含美国地址，则选择 English_US_Address 预定义语言。这可以确保更可靠地识别文本。
如果需要使用识别变体对结果进行进一步验证（如下文第 6 步中所述），请设置 RecognizerParams 对象的 SaveCharacterRecognitionVariants 和 SaveWordRecognitionVariants 属性。请注意，此设置不适用于手写体或手写印刷体文本。

有关识别不同类型字段的更多详情，请参考识别复选标记、手写体识别、识别条形码和识别带空格的词汇部分。

C#

// Run layout analysis on the document
frDocument.Analyze( null, null, null );
// The first block of the layout is assumed to be known
// to contain a US address
var firstPageLayout = frDocument.Pages[0].Layout;
FREngine.ITextBlock addressBlock = firstPageLayout.Blocks[0].GetAsTextBlock();
FREngine.IRecognizerParams paramsAddressBlock = addressBlock.RecognizerParams;
paramsAddressBlock.SetPredefinedTextLanguage( "English_US_Address" );
// Turn on collection of recognition variants
paramsAddressBlock.SaveCharacterRecognitionVariants = true;
paramsAddressBlock.SaveWordRecognitionVariants = true;
// Configure the properties of the other layout blocks in the same way
...

C++ (COM)

// Run layout analysis on the document
frDocument->Analyze( 0, 0, 0 );
// The first block of the layout is assumed to be known
// to contain a US address
FREngine::ILayoutBlocksPtr layoutBlocks = frDocument->Pages->Item( 0 )->Layout->Blocks;
FREngine::ITextBlockPtr addressBlock = layoutBlocks->Item( 0 )->GetAsTextBlock();
FREngine::IRecognizerParamsPtr paramsAddressBlock = addressBlock->RecognizerParams;
paramsAddressBlock->SetPredefinedTextLanguage( L"English_US_Address" );
// Turn on collection of recognition variants
paramsAddressBlock->SaveCharacterRecognitionVariants = VARIANT_TRUE;
paramsAddressBlock->SaveWordRecognitionVariants = VARIANT_TRUE;
// Configure the properties of the other layout blocks in the same way
...

第5步识别

第6步处理已识别的数据

第7步卸载 ABBYY FineReader Engine

使用 ABBYY FineReader Engine 完成工作后，您需要卸载 Engine 对象。为此，请使用导出函数 DeinitializeEngine。

C#

/// <summary>
/// Owns the manually loaded FREngine.dll and the FineReader Engine object;
/// this part of the class shows how the Engine is unloaded.
/// </summary>
public class EngineLoader : IDisposable
{
    /// <summary>
    /// Unloads FineReader Engine: drops the Engine reference, forces garbage
    /// collection, calls DeinitializeEngine once, and frees FREngine.dll when
    /// DllCanUnloadNow returns 0. Does nothing when the Engine is not loaded.
    /// A failure HRESULT from DeinitializeEngine or DllCanUnloadNow is thrown
    /// only after all fields have been reset.
    /// </summary>
    public void Dispose()
    {
        if (engine == null)
        {
            // Engine was not loaded
            return;
        }
        engine = null;
        // Delete all objects before deinitializing the Engine and calling FreeLibrary
        GC.Collect();
        GC.WaitForPendingFinalizers();
        GC.Collect();
        // Deinitialize exactly once, after the managed references have been collected.
        // The result is kept in its own variable so that DllCanUnloadNow does not overwrite it.
        int deinitResult = deinitializeEngine();

        int canUnloadResult = dllCanUnloadNow();
        if (canUnloadResult == 0)
        {
            FreeLibrary(dllHandle);
        }
        dllHandle = IntPtr.Zero;
        initializeEngine = null;
        deinitializeEngine = null;
        dllCanUnloadNow = null;
        // Throw only after cleaning up
        Marshal.ThrowExceptionForHR(deinitResult);
        Marshal.ThrowExceptionForHR(canUnloadResult);
    }
    // Kernel32.dll functions
    [DllImport("kernel32.dll")]
    private static extern IntPtr LoadLibraryEx(string dllToLoad, IntPtr reserved, uint flags);
    private const uint LOAD_WITH_ALTERED_SEARCH_PATH = 0x00000008;
    [DllImport("kernel32.dll")]
    private static extern IntPtr GetProcAddress(IntPtr hModule, string procedureName);
    [DllImport("kernel32.dll")]
    private static extern bool FreeLibrary(IntPtr hModule);
    // FREngine.dll functions
    [UnmanagedFunctionPointer(CallingConvention.StdCall, CharSet = CharSet.Unicode)]
    private delegate int InitializeEngine(string customerProjectId, string licensePath,
        string licensePassword, string tempFolder, string dataFolder, bool isSharedCPUCoresMode,
        ref FREngine.IEngine engine);
    [UnmanagedFunctionPointer(CallingConvention.StdCall)]
    private delegate int DeinitializeEngine();
    [UnmanagedFunctionPointer(CallingConvention.StdCall)]
    private delegate int DllCanUnloadNow();
    // Private variables
    private FREngine.IEngine engine = null;
    // Handle to FREngine.dll
    private IntPtr dllHandle = IntPtr.Zero;
    private InitializeEngine initializeEngine = null;
    private DeinitializeEngine deinitializeEngine = null;
    private DllCanUnloadNow dllCanUnloadNow = null;
}

C++ (COM)

// Releases the global Engine object, deinitializes FineReader Engine through the
// exported DeinitializeEngine function and unloads FREngine.dll.
// Does nothing when libraryHandle is 0.
// Throws a const wchar_t* message when the DeinitializeEngine export is missing or
// does not return S_OK; in that case Engine has already been released, but the
// library is not freed and libraryHandle is left unchanged.
void UnloadFREngine()
{
    if( libraryHandle == 0 ) {
        return;
    }
    // Release the Engine object
    Engine = 0;
    // Deinitialize FineReader Engine
    typedef HRESULT ( STDAPICALLTYPE* DeinitializeEngineFunc )();
    DeinitializeEngineFunc pDeinitializeEngine =
        ( DeinitializeEngineFunc )GetProcAddress( libraryHandle, "DeinitializeEngine" );
    if( pDeinitializeEngine == 0 || pDeinitializeEngine() != S_OK ) {
        throw L"卸载 ABBYY FineReader Engine 时出错";
    }
    // The FREngine.dll library can now be freed safely
    FreeLibrary( libraryHandle );
    libraryHandle = 0;
}

所需资源

您可以使用 FREngineDistribution.csv 文件来自动创建应用程序正常工作所需的文件列表。若要按此场景进行处理，请在第 5 列 (RequiredByModule) 中选择以下值：

Core

Core.Resources

Opening

Opening, Processing

Processing

Processing.OCR

Processing.OCR, Processing.ICR

Processing.OCR.NaturalLanguages

Processing.OCR.NaturalLanguages, Processing.ICR.NaturalLanguages

如果修改标准场景，请相应更改所需的模块。您还需要指定界面语言、识别语言和应用程序使用的任何其他功能（例如，如果需要打开 PDF 文件，则使用 Opening.PDF；如果需要识别 CJK 语言中的文本，则使用 Processing.OCR.CJK）。请参阅借助 FREngineDistribution.csv 文件处理进一步了解详情。

其他优化

以下是帮助文件中的相关章节，您可以在其中找到有关如何为不同处理步骤设置参数的更多信息：

识别

处理语言
使用内置和自定义识别语言。
借助字典进行处理
使用字典来改善识别质量。
识别带空格的词汇
使用字典来识别带空格的词汇（例如 New York 等）。
手写体识别
使用 ICR（智能字符识别）。
识别复选标记
设置复选标记及复选标记组的识别。
ABBYY FineReader Engine 中的特殊预定义语言
包含特殊语言单位的识别语言列表：地址、日期和时间、人名等等。这些语言可以用于字段识别。

处理已识别的数据

处理文本
处理已识别文本、段落、词汇和字符。
使用投票 API
处理词语和字符的识别变体。

另请参阅

基本使用场景实现

11/7/2025 12:48:30 PM

Your use of this site is conditioned on Your continued compliance with the Terms of Use.

Terms of Use

Disclaimer of Warranty

Limitation of Liability

Transmission and Submission of Information

Downloads

Use of Content

Trademarks

Links to Third-Party Sites

Foreign Legislation

Subscription Terms

Partner Subscription Terms

字段级识别

场景实现

第1步加载 ABBYY FineReader Engine

C#

C++ (COM)

第2步加载方案设置

C#

C++ (COM)

第3步加载和预处理图像

C#

C++ (COM)

第4步设置要识别的字段

C#

C++ (COM)

第5步识别

C#

C++ (COM)

第6步处理已识别的数据

第7步卸载 ABBYY FineReader Engine

C#

C++ (COM)

所需资源

其他优化

另请参阅