~ubuntu-branches/ubuntu/vivid/tesseract/vivid

« back to all changes in this revision

Viewing changes to doc/html/a00719_source.html

  • Committer: Package Import Robot
  • Author(s): Jeff Breidenbach
  • Date: 2014-02-03 11:10:20 UTC
  • mfrom: (1.3.1) (19.1.1 experimental)
  • Revision ID: package-import@ubuntu.com-20140203111020-igquodd7pjlp3uri
Tags: 3.03.01-1
* New upstream release, includes critical fix to PDF rendering
* Complete leptonlib transition (see bug #735509)
* Promote from experimental to unstable

Show diffs side-by-side

added added

removed removed

Lines of Context:
 
1
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
 
2
<html xmlns="http://www.w3.org/1999/xhtml">
 
3
<head>
 
4
<meta http-equiv="Content-Type" content="text/html;charset=UTF-8"/>
 
5
<meta http-equiv="X-UA-Compatible" content="IE=9"/>
 
6
<title>tesseract: /usr/local/google/home/jbreiden/tesseract-ocr-read-only/ccmain/tfacepp.cpp Source File</title>
 
7
 
 
8
<link href="tabs.css" rel="stylesheet" type="text/css"/>
 
9
<link href="doxygen.css" rel="stylesheet" type="text/css" />
 
10
<link href="navtree.css" rel="stylesheet" type="text/css"/>
 
11
<script type="text/javascript" src="jquery.js"></script>
 
12
<script type="text/javascript" src="resize.js"></script>
 
13
<script type="text/javascript" src="navtree.js"></script>
 
14
<script type="text/javascript">
 
15
  $(document).ready(initResizable);
 
16
</script>
 
17
<link href="search/search.css" rel="stylesheet" type="text/css"/>
 
18
<script type="text/javascript" src="search/search.js"></script>
 
19
<script type="text/javascript">
 
20
  $(document).ready(function() { searchBox.OnSelectItem(0); });
 
21
</script>
 
22
 
 
23
</head>
 
24
<body>
 
25
<div id="top"><!-- do not remove this div! -->
 
26
 
 
27
 
 
28
<div id="titlearea">
 
29
<table cellspacing="0" cellpadding="0">
 
30
 <tbody>
 
31
 <tr style="height: 56px;">
 
32
  
 
33
  
 
34
  <td style="padding-left: 0.5em;">
 
35
   <div id="projectname">tesseract
 
36
   &#160;<span id="projectnumber">3.03</span>
 
37
   </div>
 
38
   
 
39
  </td>
 
40
  
 
41
  
 
42
  
 
43
 </tr>
 
44
 </tbody>
 
45
</table>
 
46
</div>
 
47
 
 
48
<!-- Generated by Doxygen 1.7.6.1 -->
 
49
<script type="text/javascript">
 
50
var searchBox = new SearchBox("searchBox", "search",false,'Search');
 
51
</script>
 
52
  <div id="navrow1" class="tabs">
 
53
    <ul class="tablist">
 
54
      <li><a href="index.html"><span>Main&#160;Page</span></a></li>
 
55
      <li><a href="pages.html"><span>Related&#160;Pages</span></a></li>
 
56
      <li><a href="modules.html"><span>Modules</span></a></li>
 
57
      <li><a href="namespaces.html"><span>Namespaces</span></a></li>
 
58
      <li><a href="annotated.html"><span>Classes</span></a></li>
 
59
      <li class="current"><a href="files.html"><span>Files</span></a></li>
 
60
      <li>
 
61
        <div id="MSearchBox" class="MSearchBoxInactive">
 
62
        <span class="left">
 
63
          <img id="MSearchSelect" src="search/mag_sel.png"
 
64
               onmouseover="return searchBox.OnSearchSelectShow()"
 
65
               onmouseout="return searchBox.OnSearchSelectHide()"
 
66
               alt=""/>
 
67
          <input type="text" id="MSearchField" value="Search" accesskey="S"
 
68
               onfocus="searchBox.OnSearchFieldFocus(true)" 
 
69
               onblur="searchBox.OnSearchFieldFocus(false)" 
 
70
               onkeyup="searchBox.OnSearchFieldChange(event)"/>
 
71
          </span><span class="right">
 
72
            <a id="MSearchClose" href="javascript:searchBox.CloseResultsWindow()"><img id="MSearchCloseImg" border="0" src="search/close.png" alt=""/></a>
 
73
          </span>
 
74
        </div>
 
75
      </li>
 
76
    </ul>
 
77
  </div>
 
78
  <div id="navrow2" class="tabs2">
 
79
    <ul class="tablist">
 
80
      <li><a href="files.html"><span>File&#160;List</span></a></li>
 
81
      <li><a href="globals.html"><span>File&#160;Members</span></a></li>
 
82
    </ul>
 
83
  </div>
 
84
</div>
 
85
<div id="side-nav" class="ui-resizable side-nav-resizable">
 
86
  <div id="nav-tree">
 
87
    <div id="nav-tree-contents">
 
88
    </div>
 
89
  </div>
 
90
  <div id="splitbar" style="-moz-user-select:none;" 
 
91
       class="ui-resizable-handle">
 
92
  </div>
 
93
</div>
 
94
<script type="text/javascript">
 
95
  initNavTree('a00719.html','');
 
96
</script>
 
97
<div id="doc-content">
 
98
<div class="header">
 
99
  <div class="headertitle">
 
100
<div class="title">/usr/local/google/home/jbreiden/tesseract-ocr-read-only/ccmain/tfacepp.cpp</div>  </div>
 
101
</div><!--header-->
 
102
<div class="contents">
 
103
<a href="a00719.html">Go to the documentation of this file.</a><div class="fragment"><pre class="fragment"><a name="l00001"></a>00001 <span class="comment">/**********************************************************************</span>
 
104
<a name="l00002"></a>00002 <span class="comment"> * File:        tfacepp.cpp  (Formerly tface++.c)</span>
 
105
<a name="l00003"></a>00003 <span class="comment"> * Description: C++ side of the C/C++ Tess/Editor interface.</span>
 
106
<a name="l00004"></a>00004 <span class="comment"> * Author:                  Ray Smith</span>
 
107
<a name="l00005"></a>00005 <span class="comment"> * Created:                 Thu Apr 23 15:39:23 BST 1992</span>
 
108
<a name="l00006"></a>00006 <span class="comment"> *</span>
 
109
<a name="l00007"></a>00007 <span class="comment"> * (C) Copyright 1992, Hewlett-Packard Ltd.</span>
 
110
<a name="l00008"></a>00008 <span class="comment"> ** Licensed under the Apache License, Version 2.0 (the &quot;License&quot;);</span>
 
111
<a name="l00009"></a>00009 <span class="comment"> ** you may not use this file except in compliance with the License.</span>
 
112
<a name="l00010"></a>00010 <span class="comment"> ** You may obtain a copy of the License at</span>
 
113
<a name="l00011"></a>00011 <span class="comment"> ** http://www.apache.org/licenses/LICENSE-2.0</span>
 
114
<a name="l00012"></a>00012 <span class="comment"> ** Unless required by applicable law or agreed to in writing, software</span>
 
115
<a name="l00013"></a>00013 <span class="comment"> ** distributed under the License is distributed on an &quot;AS IS&quot; BASIS,</span>
 
116
<a name="l00014"></a>00014 <span class="comment"> ** WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.</span>
 
117
<a name="l00015"></a>00015 <span class="comment"> ** See the License for the specific language governing permissions and</span>
 
118
<a name="l00016"></a>00016 <span class="comment"> ** limitations under the License.</span>
 
119
<a name="l00017"></a>00017 <span class="comment"> *</span>
 
120
<a name="l00018"></a>00018 <span class="comment"> **********************************************************************/</span>
 
121
<a name="l00019"></a>00019 
 
122
<a name="l00020"></a>00020 <span class="preprocessor">#ifdef _MSC_VER</span>
 
123
<a name="l00021"></a>00021 <span class="preprocessor"></span><span class="preprocessor">#pragma warning(disable:4244)  // Conversion warnings</span>
 
124
<a name="l00022"></a>00022 <span class="preprocessor"></span><span class="preprocessor">#pragma warning(disable:4305)  // int/float warnings</span>
 
125
<a name="l00023"></a>00023 <span class="preprocessor"></span><span class="preprocessor">#pragma warning(disable:4800)  // int/bool warnings</span>
 
126
<a name="l00024"></a>00024 <span class="preprocessor"></span><span class="preprocessor">#endif</span>
 
127
<a name="l00025"></a>00025 <span class="preprocessor"></span>
 
128
<a name="l00026"></a>00026 <span class="preprocessor">#include &lt;math.h&gt;</span>
 
129
<a name="l00027"></a>00027 
 
130
<a name="l00028"></a>00028 <span class="preprocessor">#include &quot;<a class="code" href="a00725.html">blamer.h</a>&quot;</span>
 
131
<a name="l00029"></a>00029 <span class="preprocessor">#include &quot;<a class="code" href="a00823.html">errcode.h</a>&quot;</span>
 
132
<a name="l00030"></a>00030 <span class="preprocessor">#include &quot;<a class="code" href="a00788.html">ratngs.h</a>&quot;</span>
 
133
<a name="l00031"></a>00031 <span class="preprocessor">#include &quot;<a class="code" href="a00705.html">reject.h</a>&quot;</span>
 
134
<a name="l00032"></a>00032 <span class="preprocessor">#include &quot;<a class="code" href="a00716.html">tesseractclass.h</a>&quot;</span>
 
135
<a name="l00033"></a>00033 <span class="preprocessor">#include &quot;<a class="code" href="a00804.html">werd.h</a>&quot;</span>
 
136
<a name="l00034"></a>00034 
 
137
<a name="l00035"></a><a class="code" href="a00719.html#a2d04ee68504dcaa7ee6f56e34ade9c00">00035</a> <span class="preprocessor">#define MAX_UNDIVIDED_LENGTH 24</span>
 
138
<a name="l00036"></a>00036 <span class="preprocessor"></span>
 
139
<a name="l00037"></a>00037 
 
140
<a name="l00038"></a>00038 
 
141
<a name="l00039"></a>00039 <span class="comment">/**********************************************************************</span>
 
142
<a name="l00040"></a>00040 <span class="comment"> * recog_word</span>
 
143
<a name="l00041"></a>00041 <span class="comment"> *</span>
 
144
<a name="l00042"></a>00042 <span class="comment"> * Convert the word to tess form and pass it to the tess segmenter.</span>
 
145
<a name="l00043"></a>00043 <span class="comment"> * Convert the output back to editor form.</span>
 
146
<a name="l00044"></a>00044 <span class="comment"> **********************************************************************/</span>
 
147
<a name="l00045"></a>00045 <span class="keyword">namespace </span><a class="code" href="a01266.html#afed58feacb84df2de88bdd613cfdba6d">tesseract</a> {
 
148
<a name="l00046"></a><a class="code" href="a00607.html#afaddf88458e02ecec1d99a453d1ab4f7">00046</a> <span class="keywordtype">void</span> <a class="code" href="a00607.html#afaddf88458e02ecec1d99a453d1ab4f7">Tesseract::recog_word</a>(<a class="code" href="a00650.html">WERD_RES</a> *word) {
 
149
<a name="l00047"></a>00047   <span class="keywordflow">if</span> (<a class="code" href="a00655.html#a42414bff69207de7a50e5b1cb0d1cdba">wordrec_skip_no_truth_words</a> &amp;&amp; (word-&gt;<a class="code" href="a00650.html#a267e5d5e9fe67117e47223c5d336b8ba">blamer_bundle</a> == NULL ||
 
150
<a name="l00048"></a>00048       word-&gt;<a class="code" href="a00650.html#a267e5d5e9fe67117e47223c5d336b8ba">blamer_bundle</a>-&gt;<a class="code" href="a00274.html#af1132d873bea38b5fc5309c55fad2438">incorrect_result_reason</a>() == <a class="code" href="a00725.html#a8faf52e106c04bfdc9898ffa90b821e1a25d5b9457d6a31e2e1114c0bf8d0a795">IRR_NO_TRUTH</a>)) {
 
151
<a name="l00049"></a>00049     <span class="keywordflow">if</span> (<a class="code" href="a00314.html#a0f934f0b39cb869d2a4973269fb696cf">classify_debug_level</a>) <a class="code" href="a00860.html#a02aa7cca2c3857c14716e8cca96ace6c">tprintf</a>(<span class="stringliteral">&quot;No truth for word - skipping\n&quot;</span>);
 
152
<a name="l00050"></a>00050     word-&gt;<a class="code" href="a00650.html#ae15f8f88b29e06811c9f821b9fb4af1f">tess_failed</a> = <span class="keyword">true</span>;
 
153
<a name="l00051"></a>00051     <span class="keywordflow">return</span>;
 
154
<a name="l00052"></a>00052   }
 
155
<a name="l00053"></a>00053   <a class="code" href="a00823.html#a93a603f4063a6b9403d81caa245a583b">ASSERT_HOST</a>(!word-&gt;<a class="code" href="a00650.html#ad1d449f93bb0150bc7ef0d9b59ed27ba">chopped_word</a>-&gt;<a class="code" href="a00635.html#a52fba22521039a79d8c1c8182f602dcc">blobs</a>.<a class="code" href="a00403.html#afb0d8c52a603b6aa965d63bbf06a27dd">empty</a>());
 
156
<a name="l00054"></a>00054   <a class="code" href="a00607.html#a9642391f61959a81d94ffa8123a6b221">recog_word_recursive</a>(word);
 
157
<a name="l00055"></a>00055   word-&gt;<a class="code" href="a00650.html#a6efe07c079a04a91985f99c71258a193">SetupBoxWord</a>();
 
158
<a name="l00056"></a>00056   <span class="keywordflow">if</span> (word-&gt;<a class="code" href="a00650.html#a3d42ac7ec121263e757c9b7160dfd50d">best_choice</a>-&gt;<a class="code" href="a00649.html#a7be59abe97b052dd3aaa324aea8c4a6c">length</a>() != word-&gt;<a class="code" href="a00650.html#a3a92c8c9750d78631d75998f008f366a">box_word</a>-&gt;<a class="code" href="a00287.html#afe001fe8fb7f2d3725b2ac2f542e9878">length</a>()) {
 
159
<a name="l00057"></a>00057     <a class="code" href="a00860.html#a02aa7cca2c3857c14716e8cca96ace6c">tprintf</a>(<span class="stringliteral">&quot;recog_word ASSERT FAIL String:\&quot;%s\&quot;; &quot;</span>
 
160
<a name="l00058"></a>00058             <span class="stringliteral">&quot;Strlen=%d; #Blobs=%d\n&quot;</span>,
 
161
<a name="l00059"></a>00059             word-&gt;<a class="code" href="a00650.html#a3d42ac7ec121263e757c9b7160dfd50d">best_choice</a>-&gt;<a class="code" href="a00649.html#a9f084172bbfc8604af49788aad12da36">debug_string</a>().<a class="code" href="a00557.html#a32beee43ecab1bed8bebc3466896ad6e">string</a>(),
 
162
<a name="l00060"></a>00060             word-&gt;<a class="code" href="a00650.html#a3d42ac7ec121263e757c9b7160dfd50d">best_choice</a>-&gt;<a class="code" href="a00649.html#a7be59abe97b052dd3aaa324aea8c4a6c">length</a>(), word-&gt;<a class="code" href="a00650.html#a3a92c8c9750d78631d75998f008f366a">box_word</a>-&gt;<a class="code" href="a00287.html#afe001fe8fb7f2d3725b2ac2f542e9878">length</a>());
 
163
<a name="l00061"></a>00061   }
 
164
<a name="l00062"></a>00062   <a class="code" href="a00823.html#a93a603f4063a6b9403d81caa245a583b">ASSERT_HOST</a>(word-&gt;<a class="code" href="a00650.html#a3d42ac7ec121263e757c9b7160dfd50d">best_choice</a>-&gt;<a class="code" href="a00649.html#a7be59abe97b052dd3aaa324aea8c4a6c">length</a>() == word-&gt;<a class="code" href="a00650.html#a3a92c8c9750d78631d75998f008f366a">box_word</a>-&gt;<a class="code" href="a00287.html#afe001fe8fb7f2d3725b2ac2f542e9878">length</a>());
 
165
<a name="l00063"></a>00063   <span class="comment">// Check that the ratings matrix size matches the sum of all the</span>
 
166
<a name="l00064"></a>00064   <span class="comment">// segmentation states.</span>
 
167
<a name="l00065"></a>00065   <span class="keywordflow">if</span> (!word-&gt;<a class="code" href="a00650.html#af19f51d26dcc2d247cfd61946b370643">StatesAllValid</a>()) {
 
168
<a name="l00066"></a>00066     <a class="code" href="a00860.html#a02aa7cca2c3857c14716e8cca96ace6c">tprintf</a>(<span class="stringliteral">&quot;Not all words have valid states relative to ratings matrix!!&quot;</span>);
 
169
<a name="l00067"></a>00067     word-&gt;<a class="code" href="a00650.html#a2be5015c1ede59804ac0f4d6c13c9dcd">DebugWordChoices</a>(<span class="keyword">true</span>, NULL);
 
170
<a name="l00068"></a>00068     <a class="code" href="a00823.html#a93a603f4063a6b9403d81caa245a583b">ASSERT_HOST</a>(word-&gt;<a class="code" href="a00650.html#af19f51d26dcc2d247cfd61946b370643">StatesAllValid</a>());
 
171
<a name="l00069"></a>00069   }
 
172
<a name="l00070"></a>00070   <span class="keywordflow">if</span> (<a class="code" href="a00607.html#ac8687ff521ac4877bfcd5328832e30be">tessedit_override_permuter</a>) {
 
173
<a name="l00071"></a>00071     <span class="comment">/* Override the permuter type if a straight dictionary check disagrees. */</span>
 
174
<a name="l00072"></a>00072     <a class="code" href="a00831.html#a458fe97f82495945f8071bb3c18d1783">uinT8</a> perm_type = word-&gt;<a class="code" href="a00650.html#a3d42ac7ec121263e757c9b7160dfd50d">best_choice</a>-&gt;<a class="code" href="a00649.html#a161ac137df2d063a6421728e6aa08fcb">permuter</a>();
 
175
<a name="l00073"></a>00073     <span class="keywordflow">if</span> ((perm_type != <a class="code" href="a00788.html#a18e2c75cefe9e5b78e8ce41aa5fa25bca616bdbcaed7dd414823b303af5c8b1f1">SYSTEM_DAWG_PERM</a>) &amp;&amp;
 
176
<a name="l00074"></a>00074         (perm_type != <a class="code" href="a00788.html#a18e2c75cefe9e5b78e8ce41aa5fa25bca4fd9d3b025ecc5ea8f2248fea29543e4">FREQ_DAWG_PERM</a>) &amp;&amp; (perm_type != <a class="code" href="a00788.html#a18e2c75cefe9e5b78e8ce41aa5fa25bca5e293e54fa687876197992131e779d54">USER_DAWG_PERM</a>)) {
 
177
<a name="l00075"></a>00075       <a class="code" href="a00831.html#a458fe97f82495945f8071bb3c18d1783">uinT8</a> real_dict_perm_type = <a class="code" href="a00655.html#a13f2efa710b3a68e30e8bc2f69bee578">dict_word</a>(*word-&gt;<a class="code" href="a00650.html#a3d42ac7ec121263e757c9b7160dfd50d">best_choice</a>);
 
178
<a name="l00076"></a>00076       <span class="keywordflow">if</span> (((real_dict_perm_type == <a class="code" href="a00788.html#a18e2c75cefe9e5b78e8ce41aa5fa25bca616bdbcaed7dd414823b303af5c8b1f1">SYSTEM_DAWG_PERM</a>) ||
 
179
<a name="l00077"></a>00077            (real_dict_perm_type == <a class="code" href="a00788.html#a18e2c75cefe9e5b78e8ce41aa5fa25bca4fd9d3b025ecc5ea8f2248fea29543e4">FREQ_DAWG_PERM</a>) ||
 
180
<a name="l00078"></a>00078            (real_dict_perm_type == <a class="code" href="a00788.html#a18e2c75cefe9e5b78e8ce41aa5fa25bca5e293e54fa687876197992131e779d54">USER_DAWG_PERM</a>)) &amp;&amp;
 
181
<a name="l00079"></a>00079           (<a class="code" href="a00607.html#ac86ef254f64fc56546e9382fb125f633">alpha_count</a>(word-&gt;<a class="code" href="a00650.html#a3d42ac7ec121263e757c9b7160dfd50d">best_choice</a>-&gt;<a class="code" href="a00649.html#a41d740f0accccdfb245d34d554122116">unichar_string</a>().<a class="code" href="a00557.html#a32beee43ecab1bed8bebc3466896ad6e">string</a>(),
 
182
<a name="l00080"></a>00080                        word-&gt;<a class="code" href="a00650.html#a3d42ac7ec121263e757c9b7160dfd50d">best_choice</a>-&gt;<a class="code" href="a00649.html#a93ab94b6fa6d5c0469fb52d66c62968c">unichar_lengths</a>().<a class="code" href="a00557.html#a32beee43ecab1bed8bebc3466896ad6e">string</a>()) &gt; 0)) {
 
183
<a name="l00081"></a>00081         word-&gt;<a class="code" href="a00650.html#a3d42ac7ec121263e757c9b7160dfd50d">best_choice</a>-&gt;<a class="code" href="a00649.html#a162d90ae016fbf55256591bbf01c0c03">set_permuter</a>(real_dict_perm_type);  <span class="comment">// use dict perm</span>
 
184
<a name="l00082"></a>00082       }
 
185
<a name="l00083"></a>00083     }
 
186
<a name="l00084"></a>00084     <span class="keywordflow">if</span> (<a class="code" href="a00607.html#ab92cd0aa3a10873a0ce6f28666063a2a">tessedit_rejection_debug</a> &amp;&amp;
 
187
<a name="l00085"></a>00085         perm_type != word-&gt;<a class="code" href="a00650.html#a3d42ac7ec121263e757c9b7160dfd50d">best_choice</a>-&gt;<a class="code" href="a00649.html#a161ac137df2d063a6421728e6aa08fcb">permuter</a>()) {
 
188
<a name="l00086"></a>00086       <a class="code" href="a00860.html#a02aa7cca2c3857c14716e8cca96ace6c">tprintf</a>(<span class="stringliteral">&quot;Permuter Type Flipped from %d to %d\n&quot;</span>,
 
189
<a name="l00087"></a>00087               perm_type, word-&gt;<a class="code" href="a00650.html#a3d42ac7ec121263e757c9b7160dfd50d">best_choice</a>-&gt;<a class="code" href="a00649.html#a161ac137df2d063a6421728e6aa08fcb">permuter</a>());
 
190
<a name="l00088"></a>00088     }
 
191
<a name="l00089"></a>00089   }
 
192
<a name="l00090"></a>00090   <span class="comment">// Factored out from control.cpp</span>
 
193
<a name="l00091"></a>00091   <a class="code" href="a00823.html#a93a603f4063a6b9403d81caa245a583b">ASSERT_HOST</a>((word-&gt;<a class="code" href="a00650.html#a3d42ac7ec121263e757c9b7160dfd50d">best_choice</a> == NULL) == (word-&gt;<a class="code" href="a00650.html#ab4d02a7548dab0a4522f02ed90e48100">raw_choice</a> == NULL));
 
194
<a name="l00092"></a>00092   <span class="keywordflow">if</span> (word-&gt;<a class="code" href="a00650.html#a3d42ac7ec121263e757c9b7160dfd50d">best_choice</a> == NULL || word-&gt;<a class="code" href="a00650.html#a3d42ac7ec121263e757c9b7160dfd50d">best_choice</a>-&gt;<a class="code" href="a00649.html#a7be59abe97b052dd3aaa324aea8c4a6c">length</a>() == 0 ||
 
195
<a name="l00093"></a>00093       <span class="keyword">static_cast&lt;</span><span class="keywordtype">int</span><span class="keyword">&gt;</span>(strspn(word-&gt;<a class="code" href="a00650.html#a3d42ac7ec121263e757c9b7160dfd50d">best_choice</a>-&gt;<a class="code" href="a00649.html#a41d740f0accccdfb245d34d554122116">unichar_string</a>().<a class="code" href="a00557.html#a32beee43ecab1bed8bebc3466896ad6e">string</a>(),
 
196
<a name="l00094"></a>00094                               <span class="stringliteral">&quot; &quot;</span>)) == word-&gt;<a class="code" href="a00650.html#a3d42ac7ec121263e757c9b7160dfd50d">best_choice</a>-&gt;<a class="code" href="a00649.html#a7be59abe97b052dd3aaa324aea8c4a6c">length</a>()) {
 
197
<a name="l00095"></a>00095     word-&gt;<a class="code" href="a00650.html#ae15f8f88b29e06811c9f821b9fb4af1f">tess_failed</a> = <span class="keyword">true</span>;
 
198
<a name="l00096"></a>00096     word-&gt;<a class="code" href="a00650.html#ae24eb58be06cf275aee411d947fd31ef">reject_map</a>.<a class="code" href="a00517.html#a487e7d5d02b1fd1e142578ab4614f05b">initialise</a>(word-&gt;<a class="code" href="a00650.html#a3a92c8c9750d78631d75998f008f366a">box_word</a>-&gt;<a class="code" href="a00287.html#afe001fe8fb7f2d3725b2ac2f542e9878">length</a>());
 
199
<a name="l00097"></a>00097     word-&gt;<a class="code" href="a00650.html#ae24eb58be06cf275aee411d947fd31ef">reject_map</a>.<a class="code" href="a00517.html#ac1d7e8e50b633e7c1b9e25904567f86b">rej_word_tess_failure</a>();
 
200
<a name="l00098"></a>00098   } <span class="keywordflow">else</span> {
 
201
<a name="l00099"></a>00099     word-&gt;<a class="code" href="a00650.html#ae15f8f88b29e06811c9f821b9fb4af1f">tess_failed</a> = <span class="keyword">false</span>;
 
202
<a name="l00100"></a>00100   }
 
203
<a name="l00101"></a>00101 }
 
204
<a name="l00102"></a>00102 
 
205
<a name="l00103"></a>00103 
 
206
<a name="l00104"></a>00104 <span class="comment">/**********************************************************************</span>
 
207
<a name="l00105"></a>00105 <span class="comment"> * recog_word_recursive</span>
 
208
<a name="l00106"></a>00106 <span class="comment"> *</span>
 
209
<a name="l00107"></a>00107 <span class="comment"> * Words with more than MAX_UNDIVIDED_LENGTH blobs go to split_and_recog_word;</span>
 
210
<a name="l00108"></a>00108 <span class="comment"> * others go to cc_recog, then best_choice is made bad if longer than the output blobs, or space-padded if shorter.</span>
 
211
<a name="l00109"></a>00109 <span class="comment"> **********************************************************************/</span>
 
212
<a name="l00110"></a><a class="code" href="a00607.html#a9642391f61959a81d94ffa8123a6b221">00110</a> <span class="keywordtype">void</span> <a class="code" href="a00607.html#a9642391f61959a81d94ffa8123a6b221">Tesseract::recog_word_recursive</a>(<a class="code" href="a00650.html">WERD_RES</a> *word) {
 
213
<a name="l00111"></a>00111   <span class="keywordtype">int</span> word_length = word-&gt;<a class="code" href="a00650.html#ad1d449f93bb0150bc7ef0d9b59ed27ba">chopped_word</a>-&gt;<a class="code" href="a00635.html#adfdef9868e61650e076775011382ec70">NumBlobs</a>();  <span class="comment">// no of blobs</span>
 
214
<a name="l00112"></a>00112   <span class="keywordflow">if</span> (word_length &gt; <a class="code" href="a00719.html#a2d04ee68504dcaa7ee6f56e34ade9c00">MAX_UNDIVIDED_LENGTH</a>) {
 
215
<a name="l00113"></a>00113     <span class="keywordflow">return</span> <a class="code" href="a00607.html#a539f90c9755f9732b809cfdaf2d4cd98">split_and_recog_word</a>(word);
 
216
<a name="l00114"></a>00114   }
 
217
<a name="l00115"></a>00115   <a class="code" href="a00655.html#ae0ce1e8084b0bbe6f9d45a35af30eac4">cc_recog</a>(word);
 
218
<a name="l00116"></a>00116   word_length = word-&gt;<a class="code" href="a00650.html#a211ab5c5a13123ee7bdc7459d3363f9d">rebuild_word</a>-&gt;<a class="code" href="a00635.html#adfdef9868e61650e076775011382ec70">NumBlobs</a>();  <span class="comment">// No of blobs in output.</span>
 
219
<a name="l00117"></a>00117 
 
220
<a name="l00118"></a>00118   <span class="comment">// Do sanity checks and minor fixes on best_choice.</span>
 
221
<a name="l00119"></a>00119   <span class="keywordflow">if</span> (word-&gt;<a class="code" href="a00650.html#a3d42ac7ec121263e757c9b7160dfd50d">best_choice</a>-&gt;<a class="code" href="a00649.html#a7be59abe97b052dd3aaa324aea8c4a6c">length</a>() &gt; word_length) {
 
222
<a name="l00120"></a>00120     word-&gt;<a class="code" href="a00650.html#a3d42ac7ec121263e757c9b7160dfd50d">best_choice</a>-&gt;<a class="code" href="a00649.html#aad71e860a573a615ce8958898b2657fb" title="Set the fields in this choice to be default (bad) values.">make_bad</a>();  <span class="comment">// should never happen</span>
 
223
<a name="l00121"></a>00121     <a class="code" href="a00860.html#a02aa7cca2c3857c14716e8cca96ace6c">tprintf</a>(<span class="stringliteral">&quot;recog_word: Discarded long string \&quot;%s\&quot;&quot;</span>
 
224
<a name="l00122"></a>00122             <span class="stringliteral">&quot; (%d characters vs %d blobs)\n&quot;</span>,
 
225
<a name="l00123"></a>00123             word-&gt;<a class="code" href="a00650.html#a3d42ac7ec121263e757c9b7160dfd50d">best_choice</a>-&gt;<a class="code" href="a00649.html#a41d740f0accccdfb245d34d554122116">unichar_string</a>().<a class="code" href="a00557.html#a32beee43ecab1bed8bebc3466896ad6e">string</a>(),
 
226
<a name="l00124"></a>00124             word-&gt;<a class="code" href="a00650.html#a3d42ac7ec121263e757c9b7160dfd50d">best_choice</a>-&gt;<a class="code" href="a00649.html#a7be59abe97b052dd3aaa324aea8c4a6c">length</a>(), word_length);
 
227
<a name="l00125"></a>00125     <a class="code" href="a00860.html#a02aa7cca2c3857c14716e8cca96ace6c">tprintf</a>(<span class="stringliteral">&quot;Word is at:&quot;</span>);
 
228
<a name="l00126"></a>00126     word-&gt;<a class="code" href="a00650.html#afc15fa7c1b5ad55d6772dea0d6865df1">word</a>-&gt;<a class="code" href="a00648.html#a151bbfb39ecdef93ab1a14b0f9e4ac74">bounding_box</a>().<a class="code" href="a00592.html#a2e753aa9943276301d68e9f9cad99620">print</a>();
 
229
<a name="l00127"></a>00127   }
 
230
<a name="l00128"></a>00128   <span class="keywordflow">if</span> (word-&gt;<a class="code" href="a00650.html#a3d42ac7ec121263e757c9b7160dfd50d">best_choice</a>-&gt;<a class="code" href="a00649.html#a7be59abe97b052dd3aaa324aea8c4a6c">length</a>() &lt; word_length) {
 
231
<a name="l00129"></a>00129     <a class="code" href="a00862.html#a8578b19fa1ff5ca75080db1a18ecc32e">UNICHAR_ID</a> space_id = <a class="code" href="a00295.html#a69c5179ac5f10a24f3f97e16ca09460f">unicharset</a>.<a class="code" href="a00642.html#ae786fa834962ef4d6dbf8300c6c5d456">unichar_to_id</a>(<span class="stringliteral">&quot; &quot;</span>);
 
232
<a name="l00130"></a>00130     <span class="keywordflow">while</span> (word-&gt;<a class="code" href="a00650.html#a3d42ac7ec121263e757c9b7160dfd50d">best_choice</a>-&gt;<a class="code" href="a00649.html#a7be59abe97b052dd3aaa324aea8c4a6c">length</a>() &lt; word_length) {
 
233
<a name="l00131"></a>00131       word-&gt;<a class="code" href="a00650.html#a3d42ac7ec121263e757c9b7160dfd50d">best_choice</a>-&gt;<a class="code" href="a00649.html#af0730ae4bad7d0e705422f0574d9ff1e">append_unichar_id</a>(space_id, 1, 0.0,
 
234
<a name="l00132"></a>00132                                            word-&gt;<a class="code" href="a00650.html#a3d42ac7ec121263e757c9b7160dfd50d">best_choice</a>-&gt;<a class="code" href="a00649.html#a1b25ef2b44d21a7204483a7ca804f293">certainty</a>());
 
235
<a name="l00133"></a>00133     }
 
236
<a name="l00134"></a>00134   }
 
237
<a name="l00135"></a>00135 }
 
238
<a name="l00136"></a>00136 
 
239
<a name="l00137"></a>00137 
 
240
<a name="l00138"></a>00138 <span class="comment">/**********************************************************************</span>
 
241
<a name="l00139"></a>00139 <span class="comment"> * split_and_recog_word</span>
 
242
<a name="l00140"></a>00140 <span class="comment"> *</span>
 
243
<a name="l00141"></a>00141 <span class="comment"> * Split the word into 2 smaller pieces at the largest gap.</span>
 
244
<a name="l00142"></a>00142 <span class="comment"> * Recognize the pieces and stick the results back together.</span>
 
245
<a name="l00143"></a>00143 <span class="comment"> **********************************************************************/</span>
 
246
<a name="l00144"></a><a class="code" href="a00607.html#a539f90c9755f9732b809cfdaf2d4cd98">00144</a> <span class="keywordtype">void</span> <a class="code" href="a00607.html#a539f90c9755f9732b809cfdaf2d4cd98">Tesseract::split_and_recog_word</a>(<a class="code" href="a00650.html">WERD_RES</a> *word) {
 
247
<a name="l00145"></a>00145   <span class="comment">// Find the biggest blob gap in the chopped_word.</span>
 
248
<a name="l00146"></a>00146   <span class="keywordtype">int</span> bestgap = -<a class="code" href="a00831.html#aac62d87844689a18b6f5339a89ed6e7f">MAX_INT32</a>;
 
249
<a name="l00147"></a>00147   <span class="keywordtype">int</span> split_index = 0;
 
250
<a name="l00148"></a>00148   <span class="keywordflow">for</span> (<span class="keywordtype">int</span> b = 1; b &lt; word-&gt;<a class="code" href="a00650.html#ad1d449f93bb0150bc7ef0d9b59ed27ba">chopped_word</a>-&gt;<a class="code" href="a00635.html#adfdef9868e61650e076775011382ec70">NumBlobs</a>(); ++b) {
 
251
<a name="l00149"></a>00149     <a class="code" href="a00592.html">TBOX</a> prev_box = word-&gt;<a class="code" href="a00650.html#ad1d449f93bb0150bc7ef0d9b59ed27ba">chopped_word</a>-&gt;<a class="code" href="a00635.html#a52fba22521039a79d8c1c8182f602dcc">blobs</a>[b - 1]-&gt;bounding_box();
 
252
<a name="l00150"></a>00150     <a class="code" href="a00592.html">TBOX</a> blob_box = word-&gt;<a class="code" href="a00650.html#ad1d449f93bb0150bc7ef0d9b59ed27ba">chopped_word</a>-&gt;<a class="code" href="a00635.html#a52fba22521039a79d8c1c8182f602dcc">blobs</a>[b]-&gt;bounding_box();
 
253
<a name="l00151"></a>00151     <span class="keywordtype">int</span> gap = blob_box.<a class="code" href="a00592.html#a724fabf566586b663577dfa944ffbc61">left</a>() - prev_box.<a class="code" href="a00592.html#a8703081c1a1c26db3a4dddaca1028e34">right</a>();
 
254
<a name="l00152"></a>00152     <span class="keywordflow">if</span> (gap &gt; bestgap) {
 
255
<a name="l00153"></a>00153       bestgap = gap;
 
256
<a name="l00154"></a>00154       split_index = b;
 
257
<a name="l00155"></a>00155     }
 
258
<a name="l00156"></a>00156   }
 
259
<a name="l00157"></a>00157   <a class="code" href="a00823.html#a93a603f4063a6b9403d81caa245a583b">ASSERT_HOST</a>(split_index &gt; 0);
 
260
<a name="l00158"></a>00158 
 
261
<a name="l00159"></a>00159   <a class="code" href="a00650.html">WERD_RES</a> *word2 = NULL;
 
262
<a name="l00160"></a>00160   <a class="code" href="a00274.html">BlamerBundle</a> *orig_bb = NULL;
 
263
<a name="l00161"></a>00161   <a class="code" href="a00607.html#abf10ca6bceafbca08eb585679b06ffb9">split_word</a>(word, split_index, &amp;word2, &amp;orig_bb);
 
264
<a name="l00162"></a>00162 
 
265
<a name="l00163"></a>00163   <span class="comment">// Recognize the first part of the word.</span>
 
266
<a name="l00164"></a>00164   <a class="code" href="a00607.html#a9642391f61959a81d94ffa8123a6b221">recog_word_recursive</a>(word);
 
267
<a name="l00165"></a>00165   <span class="comment">// Recognize the second part of the word.</span>
 
268
<a name="l00166"></a>00166   <a class="code" href="a00607.html#a9642391f61959a81d94ffa8123a6b221">recog_word_recursive</a>(word2);
 
269
<a name="l00167"></a>00167 
 
270
<a name="l00168"></a>00168   <a class="code" href="a00607.html#a2e5e3d8611a06d346cda1179b669fdb7">join_words</a>(word, word2, orig_bb);
 
271
<a name="l00169"></a>00169 }
 
272
<a name="l00170"></a>00170 
 
273
<a name="l00171"></a>00171 
 
274
<a name="l00172"></a>00172 <span class="comment">/**********************************************************************</span>
 
275
<a name="l00173"></a>00173 <span class="comment"> * split_word</span>
 
276
<a name="l00174"></a>00174 <span class="comment"> *</span>
 
277
<a name="l00175"></a>00175 <span class="comment"> * Split a given WERD_RES in place into two smaller words for recognition.</span>
 
278
<a name="l00176"></a>00176 <span class="comment"> * split_pt is the index of the first blob to go in the second word.</span>
 
279
<a name="l00177"></a>00177 <span class="comment"> * The underlying word is left alone, only the TWERD (and subsequent data)</span>
 
280
<a name="l00178"></a>00178 <span class="comment"> * are split up.  orig_blamer_bundle is set to the original blamer bundle,</span>
 
281
<a name="l00179"></a>00179 <span class="comment"> * and will now be owned by the caller.  New blamer bundles are forged for the</span>
 
282
<a name="l00180"></a>00180 <span class="comment"> * two pieces.</span>
 
283
<a name="l00181"></a>00181 <span class="comment"> **********************************************************************/</span>
 
284
<a name="l00182"></a><a class="code" href="a00607.html#abf10ca6bceafbca08eb585679b06ffb9">00182</a> <span class="keywordtype">void</span> <a class="code" href="a00607.html#abf10ca6bceafbca08eb585679b06ffb9">Tesseract::split_word</a>(<a class="code" href="a00650.html">WERD_RES</a> *word,
 
285
<a name="l00183"></a>00183                            <span class="keywordtype">int</span> split_pt,
 
286
<a name="l00184"></a>00184                            <a class="code" href="a00650.html">WERD_RES</a> **right_piece,
 
287
<a name="l00185"></a>00185                            <a class="code" href="a00274.html">BlamerBundle</a> **orig_blamer_bundle)<span class="keyword"> const </span>{
 
288
<a name="l00186"></a>00186   <a class="code" href="a00823.html#a93a603f4063a6b9403d81caa245a583b">ASSERT_HOST</a>(split_pt &gt;0 &amp;&amp; split_pt &lt; word-&gt;chopped_word-&gt;NumBlobs());
 
289
<a name="l00187"></a>00187 
 
290
<a name="l00188"></a>00188   <span class="comment">// Save a copy of the blamer bundle so we can try to reconstruct it below.</span>
 
291
<a name="l00189"></a>00189   <a class="code" href="a00274.html">BlamerBundle</a> *orig_bb =
 
292
<a name="l00190"></a>00190       word-&gt;<a class="code" href="a00650.html#a267e5d5e9fe67117e47223c5d336b8ba">blamer_bundle</a> ? <span class="keyword">new</span> <a class="code" href="a00274.html">BlamerBundle</a>(*word-&gt;<a class="code" href="a00650.html#a267e5d5e9fe67117e47223c5d336b8ba">blamer_bundle</a>) : NULL;
 
293
<a name="l00191"></a>00191 
 
294
<a name="l00192"></a>00192   <a class="code" href="a00650.html">WERD_RES</a> *word2 = <span class="keyword">new</span> <a class="code" href="a00650.html">WERD_RES</a>(*word);
 
295
<a name="l00193"></a>00193 
 
296
<a name="l00194"></a>00194   <span class="comment">// blow away the copied chopped_word, as we want to work with</span>
 
297
<a name="l00195"></a>00195   <span class="comment">// the blobs from the input chopped_word so seam_arrays can be merged.</span>
 
298
<a name="l00196"></a>00196   <a class="code" href="a00635.html">TWERD</a> *chopped = word-&gt;<a class="code" href="a00650.html#ad1d449f93bb0150bc7ef0d9b59ed27ba">chopped_word</a>;
 
299
<a name="l00197"></a>00197   <a class="code" href="a00635.html">TWERD</a> *chopped2 = <span class="keyword">new</span> <a class="code" href="a00635.html">TWERD</a>;
 
300
<a name="l00198"></a>00198   chopped2-&gt;<a class="code" href="a00635.html#a52fba22521039a79d8c1c8182f602dcc">blobs</a>.<a class="code" href="a00403.html#aa225ea3fc9374961482bc804028317eb">reserve</a>(chopped-&gt;<a class="code" href="a00635.html#adfdef9868e61650e076775011382ec70">NumBlobs</a>() - split_pt);
 
301
<a name="l00199"></a>00199   <span class="keywordflow">for</span> (<span class="keywordtype">int</span> i = split_pt; i &lt; chopped-&gt;<a class="code" href="a00635.html#adfdef9868e61650e076775011382ec70">NumBlobs</a>(); ++i) {
 
302
<a name="l00200"></a>00200     chopped2-&gt;<a class="code" href="a00635.html#a52fba22521039a79d8c1c8182f602dcc">blobs</a>.<a class="code" href="a00403.html#a0dc89fe2a365b04a61017f9d78c1a303">push_back</a>(chopped-&gt;<a class="code" href="a00635.html#a52fba22521039a79d8c1c8182f602dcc">blobs</a>[i]);
 
303
<a name="l00201"></a>00201   }
 
304
<a name="l00202"></a>00202   chopped-&gt;<a class="code" href="a00635.html#a52fba22521039a79d8c1c8182f602dcc">blobs</a>.<a class="code" href="a00403.html#a980882b5ebc3e72fdedbdbe345196f21">truncate</a>(split_pt);
 
305
<a name="l00203"></a>00203   word-&gt;<a class="code" href="a00650.html#ad1d449f93bb0150bc7ef0d9b59ed27ba">chopped_word</a> = NULL;
 
306
<a name="l00204"></a>00204   <span class="keyword">delete</span> word2-&gt;<a class="code" href="a00650.html#ad1d449f93bb0150bc7ef0d9b59ed27ba">chopped_word</a>;
 
307
<a name="l00205"></a>00205   word2-&gt;<a class="code" href="a00650.html#ad1d449f93bb0150bc7ef0d9b59ed27ba">chopped_word</a> = NULL;
 
308
<a name="l00206"></a>00206 
 
309
<a name="l00207"></a>00207   <span class="keyword">const</span> <a class="code" href="a00642.html">UNICHARSET</a> &amp;<a class="code" href="a00295.html#a69c5179ac5f10a24f3f97e16ca09460f">unicharset</a> = *word-&gt;<a class="code" href="a00650.html#a053a2aeeddc26a93a41a04fa08dd688a">uch_set</a>;
 
310
<a name="l00208"></a>00208   word-&gt;<a class="code" href="a00650.html#a6ef9853bc0dca7249a30c897bcba4aba">ClearResults</a>();
 
311
<a name="l00209"></a>00209   word2-&gt;<a class="code" href="a00650.html#a6ef9853bc0dca7249a30c897bcba4aba">ClearResults</a>();
 
312
<a name="l00210"></a>00210   word-&gt;<a class="code" href="a00650.html#ad1d449f93bb0150bc7ef0d9b59ed27ba">chopped_word</a> = chopped;
 
313
<a name="l00211"></a>00211   word2-&gt;<a class="code" href="a00650.html#ad1d449f93bb0150bc7ef0d9b59ed27ba">chopped_word</a> = chopped2;
 
314
<a name="l00212"></a>00212   word-&gt;<a class="code" href="a00650.html#ac81aedd52598dffd0f11ca74ee86be6f">SetupBasicsFromChoppedWord</a>(unicharset);
 
315
<a name="l00213"></a>00213   word2-&gt;<a class="code" href="a00650.html#ac81aedd52598dffd0f11ca74ee86be6f">SetupBasicsFromChoppedWord</a>(unicharset);
 
316
<a name="l00214"></a>00214 
 
317
<a name="l00215"></a>00215   <span class="comment">// Try to adjust the blamer bundle.</span>
 
318
<a name="l00216"></a>00216   <span class="keywordflow">if</span> (orig_bb != NULL) {
 
319
<a name="l00217"></a>00217     <span class="comment">// TODO(rays) Looks like a leak to me.</span>
 
320
<a name="l00218"></a>00218     <span class="comment">// orig_bb should take, rather than copy.</span>
 
321
<a name="l00219"></a>00219     word-&gt;<a class="code" href="a00650.html#a267e5d5e9fe67117e47223c5d336b8ba">blamer_bundle</a> = <span class="keyword">new</span> <a class="code" href="a00274.html">BlamerBundle</a>();
 
322
<a name="l00220"></a>00220     word2-&gt;<a class="code" href="a00650.html#a267e5d5e9fe67117e47223c5d336b8ba">blamer_bundle</a> = <span class="keyword">new</span> <a class="code" href="a00274.html">BlamerBundle</a>();
 
323
<a name="l00221"></a>00221     orig_bb-&gt;SplitBundle(chopped-&gt;<a class="code" href="a00635.html#a52fba22521039a79d8c1c8182f602dcc">blobs</a>.<a class="code" href="a00403.html#a6e6d6497a6f7dd999b6d591c15354167">back</a>()-&gt;<a class="code" href="a00591.html#a8f1f8f110170fe12cf8147d504cd0ea2">bounding_box</a>().<a class="code" href="a00592.html#a8703081c1a1c26db3a4dddaca1028e34">right</a>(),
 
324
<a name="l00222"></a>00222                          word2-&gt;<a class="code" href="a00650.html#ad1d449f93bb0150bc7ef0d9b59ed27ba">chopped_word</a>-&gt;<a class="code" href="a00635.html#a52fba22521039a79d8c1c8182f602dcc">blobs</a>[0]-&gt;bounding_box().left(),
 
325
<a name="l00223"></a>00223                          <a class="code" href="a00655.html#a76e95cb7cbfe636ab00ec46150b5524d">wordrec_debug_blamer</a>,
 
326
<a name="l00224"></a>00224                          word-&gt;<a class="code" href="a00650.html#a267e5d5e9fe67117e47223c5d336b8ba">blamer_bundle</a>, word2-&gt;<a class="code" href="a00650.html#a267e5d5e9fe67117e47223c5d336b8ba">blamer_bundle</a>);
 
327
<a name="l00225"></a>00225   }
 
328
<a name="l00226"></a>00226 
 
329
<a name="l00227"></a>00227   *right_piece = word2;
 
330
<a name="l00228"></a>00228   *orig_blamer_bundle = orig_bb;
 
331
<a name="l00229"></a>00229 }
 
332
<a name="l00230"></a>00230 
 
333
<a name="l00231"></a>00231 
 
334
<a name="l00232"></a>00232 <span class="comment">/**********************************************************************</span>
 
335
<a name="l00233"></a>00233 <span class="comment"> * join_words</span>
 
336
<a name="l00234"></a>00234 <span class="comment"> *</span>
 
337
<a name="l00235"></a>00235 <span class="comment"> * The opposite of split_word():</span>
 
338
<a name="l00236"></a>00236 <span class="comment"> *  join word2 (including any recognized data / seam array / etc)</span>
 
339
<a name="l00237"></a>00237 <span class="comment"> *  onto the right of word and then delete word2.</span>
 
340
<a name="l00238"></a>00238 <span class="comment"> *  Also, if orig_bb is provided, stitch it back into word.</span>
 
341
<a name="l00239"></a>00239 <span class="comment"> **********************************************************************/</span>
 
342
<a name="l00240"></a><a class="code" href="a00607.html#a2e5e3d8611a06d346cda1179b669fdb7">00240</a> <span class="keywordtype">void</span> <a class="code" href="a00607.html#a2e5e3d8611a06d346cda1179b669fdb7">Tesseract::join_words</a>(<a class="code" href="a00650.html">WERD_RES</a> *word,
 
343
<a name="l00241"></a>00241                            <a class="code" href="a00650.html">WERD_RES</a> *word2,
 
344
<a name="l00242"></a>00242                            <a class="code" href="a00274.html">BlamerBundle</a> *orig_bb)<span class="keyword"> const </span>{
 
345
<a name="l00243"></a>00243   <a class="code" href="a00592.html">TBOX</a> prev_box = word-&gt;<a class="code" href="a00650.html#ad1d449f93bb0150bc7ef0d9b59ed27ba">chopped_word</a>-&gt;<a class="code" href="a00635.html#a52fba22521039a79d8c1c8182f602dcc">blobs</a>.<a class="code" href="a00403.html#a6e6d6497a6f7dd999b6d591c15354167">back</a>()-&gt;<a class="code" href="a00591.html#a8f1f8f110170fe12cf8147d504cd0ea2">bounding_box</a>();
 
346
<a name="l00244"></a>00244   <a class="code" href="a00592.html">TBOX</a> blob_box = word2-&gt;<a class="code" href="a00650.html#ad1d449f93bb0150bc7ef0d9b59ed27ba">chopped_word</a>-&gt;<a class="code" href="a00635.html#a52fba22521039a79d8c1c8182f602dcc">blobs</a>[0]-&gt;bounding_box();
 
347
<a name="l00245"></a>00245   <span class="comment">// Tack the word2 outputs onto the end of the word outputs.</span>
 
348
<a name="l00246"></a>00246   word-&gt;<a class="code" href="a00650.html#ad1d449f93bb0150bc7ef0d9b59ed27ba">chopped_word</a>-&gt;<a class="code" href="a00635.html#a52fba22521039a79d8c1c8182f602dcc">blobs</a> += word2-&gt;<a class="code" href="a00650.html#ad1d449f93bb0150bc7ef0d9b59ed27ba">chopped_word</a>-&gt;<a class="code" href="a00635.html#a52fba22521039a79d8c1c8182f602dcc">blobs</a>;
 
349
<a name="l00247"></a>00247   word-&gt;<a class="code" href="a00650.html#a211ab5c5a13123ee7bdc7459d3363f9d">rebuild_word</a>-&gt;<a class="code" href="a00635.html#a52fba22521039a79d8c1c8182f602dcc">blobs</a> += word2-&gt;<a class="code" href="a00650.html#a211ab5c5a13123ee7bdc7459d3363f9d">rebuild_word</a>-&gt;<a class="code" href="a00635.html#a52fba22521039a79d8c1c8182f602dcc">blobs</a>;
 
350
<a name="l00248"></a>00248   word2-&gt;<a class="code" href="a00650.html#ad1d449f93bb0150bc7ef0d9b59ed27ba">chopped_word</a>-&gt;<a class="code" href="a00635.html#a52fba22521039a79d8c1c8182f602dcc">blobs</a>.<a class="code" href="a00403.html#a9cdbff49b186574b83e43afba606fdd9">clear</a>();
 
351
<a name="l00249"></a>00249   word2-&gt;<a class="code" href="a00650.html#a211ab5c5a13123ee7bdc7459d3363f9d">rebuild_word</a>-&gt;<a class="code" href="a00635.html#a52fba22521039a79d8c1c8182f602dcc">blobs</a>.<a class="code" href="a00403.html#a9cdbff49b186574b83e43afba606fdd9">clear</a>();
 
352
<a name="l00250"></a>00250   <a class="code" href="a00629.html">TPOINT</a> split_pt;
 
353
<a name="l00251"></a>00251   split_pt.<a class="code" href="a00629.html#aa9c98655c3a2a0437821e5a3d3418b0f">x</a> = (prev_box.<a class="code" href="a00592.html#a8703081c1a1c26db3a4dddaca1028e34">right</a>() + blob_box.<a class="code" href="a00592.html#a724fabf566586b663577dfa944ffbc61">left</a>()) / 2;
 
354
<a name="l00252"></a>00252   split_pt.<a class="code" href="a00629.html#a6d62f015b74612e43975e439a096039c">y</a> = (prev_box.<a class="code" href="a00592.html#adf92e9fdac1bdf11c10d1c4d1178791a">top</a>() + prev_box.<a class="code" href="a00592.html#a4451d237f1cd18c4982d63fe36a11fc3">bottom</a>() +
 
355
<a name="l00253"></a>00253                 blob_box.<a class="code" href="a00592.html#adf92e9fdac1bdf11c10d1c4d1178791a">top</a>() + blob_box.<a class="code" href="a00592.html#a4451d237f1cd18c4982d63fe36a11fc3">bottom</a>()) / 4;
 
356
<a name="l00254"></a>00254   <span class="comment">// Move the word2 seams onto the end of the word1 seam_array.</span>
 
357
<a name="l00255"></a>00255   <span class="comment">// Since the seam list is one element short, an empty seam marking the</span>
 
358
<a name="l00256"></a>00256   <span class="comment">// end of the last blob in the first word is needed first.</span>
 
359
<a name="l00257"></a>00257   word-&gt;<a class="code" href="a00650.html#a3d0de828a382a88581dafb5a304141f1">seam_array</a>.<a class="code" href="a00403.html#a0dc89fe2a365b04a61017f9d78c1a303">push_back</a>(<span class="keyword">new</span> <a class="code" href="a00533.html">SEAM</a>(0.0f, split_pt, NULL, NULL, NULL));
 
360
<a name="l00258"></a>00258   word-&gt;<a class="code" href="a00650.html#a3d0de828a382a88581dafb5a304141f1">seam_array</a> += word2-&gt;<a class="code" href="a00650.html#a3d0de828a382a88581dafb5a304141f1">seam_array</a>;
 
361
<a name="l00259"></a>00259   word2-&gt;<a class="code" href="a00650.html#a3d0de828a382a88581dafb5a304141f1">seam_array</a>.<a class="code" href="a00403.html#a980882b5ebc3e72fdedbdbe345196f21">truncate</a>(0);
 
362
<a name="l00260"></a>00260   <span class="comment">// Fix widths and gaps.</span>
 
363
<a name="l00261"></a>00261   word-&gt;<a class="code" href="a00650.html#a3aeb8deef67c5383e1a116049b994be4">blob_widths</a> += word2-&gt;<a class="code" href="a00650.html#a3aeb8deef67c5383e1a116049b994be4">blob_widths</a>;
 
364
<a name="l00262"></a>00262   word-&gt;<a class="code" href="a00650.html#ae75c16786fddc82649dcbe6febeb1431">blob_gaps</a> += word2-&gt;<a class="code" href="a00650.html#ae75c16786fddc82649dcbe6febeb1431">blob_gaps</a>;
 
365
<a name="l00263"></a>00263   <span class="comment">// Fix the ratings matrix.</span>
 
366
<a name="l00264"></a>00264   <span class="keywordtype">int</span> rat1 = word-&gt;<a class="code" href="a00650.html#af7454f140688a32b2bebb60ab36e91ee">ratings</a>-&gt;<a class="code" href="a00264.html#a82cbdd8a6eb23048b3d1cb656d34a364">dimension</a>();
 
367
<a name="l00265"></a>00265   <span class="keywordtype">int</span> rat2 = word2-&gt;<a class="code" href="a00650.html#af7454f140688a32b2bebb60ab36e91ee">ratings</a>-&gt;<a class="code" href="a00264.html#a82cbdd8a6eb23048b3d1cb656d34a364">dimension</a>();
 
368
<a name="l00266"></a>00266   word-&gt;<a class="code" href="a00650.html#af7454f140688a32b2bebb60ab36e91ee">ratings</a>-&gt;<a class="code" href="a00264.html#a120f2a3063e95bc9ffdcbc4209ee149d">AttachOnCorner</a>(word2-&gt;<a class="code" href="a00650.html#af7454f140688a32b2bebb60ab36e91ee">ratings</a>);
 
369
<a name="l00267"></a>00267   <a class="code" href="a00823.html#a93a603f4063a6b9403d81caa245a583b">ASSERT_HOST</a>(word-&gt;<a class="code" href="a00650.html#af7454f140688a32b2bebb60ab36e91ee">ratings</a>-&gt;<a class="code" href="a00264.html#a82cbdd8a6eb23048b3d1cb656d34a364">dimension</a>() == rat1 + rat2);
 
370
<a name="l00268"></a>00268   word-&gt;<a class="code" href="a00650.html#ab3c9354a32a99c3283f4ac411b5f9b93">best_state</a> += word2-&gt;<a class="code" href="a00650.html#ab3c9354a32a99c3283f4ac411b5f9b93">best_state</a>;
 
371
<a name="l00269"></a>00269   <span class="comment">// Append the word choices.</span>
 
372
<a name="l00270"></a>00270   *word-&gt;<a class="code" href="a00650.html#ab4d02a7548dab0a4522f02ed90e48100">raw_choice</a> += *word2-&gt;<a class="code" href="a00650.html#ab4d02a7548dab0a4522f02ed90e48100">raw_choice</a>;
 
373
<a name="l00271"></a>00271 
 
374
<a name="l00272"></a>00272   <span class="comment">// How many alt choices from each should we try to get?</span>
 
375
<a name="l00273"></a>00273   <span class="keyword">const</span> <span class="keywordtype">int</span> kAltsPerPiece = 2;
 
376
<a name="l00274"></a>00274   <span class="comment">// When do we start throwing away extra alt choices?</span>
 
377
<a name="l00275"></a>00275   <span class="keyword">const</span> <span class="keywordtype">int</span> kTooManyAltChoices = 100;
 
378
<a name="l00276"></a>00276 
 
379
<a name="l00277"></a>00277   <span class="comment">// Construct the cartesian product of the best_choices of word(1) and word2.</span>
 
380
<a name="l00278"></a>00278   WERD_CHOICE_LIST joined_choices;
 
381
<a name="l00279"></a>00279   WERD_CHOICE_IT jc_it(&amp;joined_choices);
 
382
<a name="l00280"></a>00280   WERD_CHOICE_IT bc1_it(&amp;word-&gt;<a class="code" href="a00650.html#a23445f9e8dce6db8902504c0fe1d2e37">best_choices</a>);
 
383
<a name="l00281"></a>00281   WERD_CHOICE_IT bc2_it(&amp;word2-&gt;<a class="code" href="a00650.html#a23445f9e8dce6db8902504c0fe1d2e37">best_choices</a>);
 
384
<a name="l00282"></a>00282   <span class="keywordtype">int</span> num_word1_choices = word-&gt;<a class="code" href="a00650.html#a23445f9e8dce6db8902504c0fe1d2e37">best_choices</a>.length();
 
385
<a name="l00283"></a>00283   <span class="keywordtype">int</span> total_joined_choices = num_word1_choices;
 
386
<a name="l00284"></a>00284   <span class="comment">// Nota Bene: For the main loop here, we operate only on the 2nd and greater</span>
 
387
<a name="l00285"></a>00285   <span class="comment">// word2 choices, and put them in the joined_choices list. The 1st word2</span>
 
388
<a name="l00286"></a>00286   <span class="comment">// choice gets added to the original word1 choices in-place after we have</span>
 
389
<a name="l00287"></a>00287   <span class="comment">// finished with them.</span>
 
390
<a name="l00288"></a>00288   <span class="keywordtype">int</span> bc2_index = 1;
 
391
<a name="l00289"></a>00289   <span class="keywordflow">for</span> (bc2_it.forward(); !bc2_it.at_first(); bc2_it.forward(), ++bc2_index) {
 
392
<a name="l00290"></a>00290     <span class="keywordflow">if</span> (total_joined_choices &gt;= kTooManyAltChoices &amp;&amp;
 
393
<a name="l00291"></a>00291         bc2_index &gt; kAltsPerPiece)
 
394
<a name="l00292"></a>00292       <span class="keywordflow">break</span>;
 
395
<a name="l00293"></a>00293     <span class="keywordtype">int</span> bc1_index = 0;
 
396
<a name="l00294"></a>00294     <span class="keywordflow">for</span> (bc1_it.move_to_first(); bc1_index &lt; num_word1_choices;
 
397
<a name="l00295"></a>00295         ++bc1_index, bc1_it.forward()) {
 
398
<a name="l00296"></a>00296       <span class="keywordflow">if</span> (total_joined_choices &gt;= kTooManyAltChoices &amp;&amp;
 
399
<a name="l00297"></a>00297           bc1_index &gt; kAltsPerPiece)
 
400
<a name="l00298"></a>00298         <span class="keywordflow">break</span>;
 
401
<a name="l00299"></a>00299       <a class="code" href="a00649.html">WERD_CHOICE</a> *wc = <span class="keyword">new</span> <a class="code" href="a00649.html">WERD_CHOICE</a>(*bc1_it.data());
 
402
<a name="l00300"></a>00300       *wc += *bc2_it.data();
 
403
<a name="l00301"></a>00301       jc_it.add_after_then_move(wc);
 
404
<a name="l00302"></a>00302       ++total_joined_choices;
 
405
<a name="l00303"></a>00303     }
 
406
<a name="l00304"></a>00304   }
 
407
<a name="l00305"></a>00305   <span class="comment">// Now that we&#39;ve filled in as many alternates as we want, paste the best</span>
 
408
<a name="l00306"></a>00306   <span class="comment">// choice for word2 onto the original word alt_choices.</span>
 
409
<a name="l00307"></a>00307   bc1_it.move_to_first();
 
410
<a name="l00308"></a>00308   bc2_it.move_to_first();
 
411
<a name="l00309"></a>00309   <span class="keywordflow">for</span> (bc1_it.mark_cycle_pt(); !bc1_it.cycled_list(); bc1_it.forward()) {
 
412
<a name="l00310"></a>00310     *bc1_it.data() += *bc2_it.data();
 
413
<a name="l00311"></a>00311   }
 
414
<a name="l00312"></a>00312   bc1_it.move_to_last();
 
415
<a name="l00313"></a>00313   bc1_it.add_list_after(&amp;joined_choices);
 
416
<a name="l00314"></a>00314 
 
417
<a name="l00315"></a>00315   <span class="comment">// Restore the pointer to original blamer bundle and combine blamer</span>
 
418
<a name="l00316"></a>00316   <span class="comment">// information recorded in the splits.</span>
 
419
<a name="l00317"></a>00317   <span class="keywordflow">if</span> (orig_bb != NULL) {
 
420
<a name="l00318"></a>00318     orig_bb-&gt;<a class="code" href="a00274.html#a61e027f96d2d14b05dee51596ee75022">JoinBlames</a>(*word-&gt;<a class="code" href="a00650.html#a267e5d5e9fe67117e47223c5d336b8ba">blamer_bundle</a>, *word2-&gt;<a class="code" href="a00650.html#a267e5d5e9fe67117e47223c5d336b8ba">blamer_bundle</a>,
 
421
<a name="l00319"></a>00319                         <a class="code" href="a00655.html#a76e95cb7cbfe636ab00ec46150b5524d">wordrec_debug_blamer</a>);
 
422
<a name="l00320"></a>00320     <span class="keyword">delete</span> word-&gt;<a class="code" href="a00650.html#a267e5d5e9fe67117e47223c5d336b8ba">blamer_bundle</a>;
 
423
<a name="l00321"></a>00321     word-&gt;<a class="code" href="a00650.html#a267e5d5e9fe67117e47223c5d336b8ba">blamer_bundle</a> = orig_bb;
 
424
<a name="l00322"></a>00322   }
 
425
<a name="l00323"></a>00323   word-&gt;<a class="code" href="a00650.html#a6efe07c079a04a91985f99c71258a193">SetupBoxWord</a>();
 
426
<a name="l00324"></a>00324   word-&gt;<a class="code" href="a00650.html#ae24eb58be06cf275aee411d947fd31ef">reject_map</a>.<a class="code" href="a00517.html#a487e7d5d02b1fd1e142578ab4614f05b">initialise</a>(word-&gt;<a class="code" href="a00650.html#a3a92c8c9750d78631d75998f008f366a">box_word</a>-&gt;<a class="code" href="a00287.html#afe001fe8fb7f2d3725b2ac2f542e9878">length</a>());
 
427
<a name="l00325"></a>00325   <span class="keyword">delete</span> word2;
 
428
<a name="l00326"></a>00326 }
 
429
<a name="l00327"></a>00327 
 
430
<a name="l00328"></a>00328 
 
431
<a name="l00329"></a>00329 }  <span class="comment">// namespace tesseract</span>
 
432
</pre></div></div><!-- contents -->
 
433
</div>
 
434
<!-- Search-filter popup (window showing the filter options).
     The container's mouseover, mouseout and keydown handlers, and every
     SelectItem link, call into the searchBox object, which is not defined
     in this file. Each link passes its zero-based position
     (0 = All through 10 = Defines) to searchBox.OnSelectItem. -->
<div id="MSearchSelectWindow"
     onmouseover="return searchBox.OnSearchSelectShow()"
     onmouseout="return searchBox.OnSearchSelectHide()"
     onkeydown="return searchBox.OnSearchSelectKey(event)">
<a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(0)"><span class="SelectionMark">&#160;</span>All</a><a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(1)"><span class="SelectionMark">&#160;</span>Classes</a><a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(2)"><span class="SelectionMark">&#160;</span>Namespaces</a><a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(3)"><span class="SelectionMark">&#160;</span>Files</a><a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(4)"><span class="SelectionMark">&#160;</span>Functions</a><a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(5)"><span class="SelectionMark">&#160;</span>Variables</a><a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(6)"><span class="SelectionMark">&#160;</span>Typedefs</a><a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(7)"><span class="SelectionMark">&#160;</span>Enumerations</a><a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(8)"><span class="SelectionMark">&#160;</span>Enumerator</a><a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(9)"><span class="SelectionMark">&#160;</span>Friends</a><a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(10)"><span class="SelectionMark">&#160;</span>Defines</a></div>
 
440
 
 
441
<!-- iframe showing the search results (closed by default).
     The title attribute gives the frame an accessible name, so assistive
     technology can announce what the frame contains. -->
<div id="MSearchResultsWindow">
<iframe src="javascript:void(0)" frameborder="0"
        name="MSearchResults" id="MSearchResults" title="Search results">
</iframe>
</div>
 
447
 
 
448
  <div id="nav-path" class="navpath">
 
449
    <ul>
 
450
      <li class="navelem"><a class="el" href="a00719.html">tfacepp.cpp</a>      </li>
 
451
 
 
452
    <li class="footer">Generated on Mon Feb 3 2014 10:59:07 for tesseract by
 
453
    <a href="http://www.doxygen.org/index.html">
 
454
    <img class="footer" src="doxygen.png" alt="doxygen"/></a> 1.7.6.1 </li>
 
455
   </ul>
 
456
 </div>
 
457
 
 
458
 
 
459
</body>
 
460
</html>