~ubuntu-branches/ubuntu/vivid/tesseract/vivid

« back to all changes in this revision

Viewing changes to doc/html/a00687_source.html

  • Committer: Package Import Robot
  • Author(s): Jeff Breidenbach
  • Date: 2014-02-03 11:10:20 UTC
  • mfrom: (1.3.1) (19.1.1 experimental)
  • Revision ID: package-import@ubuntu.com-20140203111020-igquodd7pjlp3uri
Tags: 3.03.01-1
* New upstream release, includes critical fix to PDF rendering
* Complete leptonlib transition (see bug #735509)
* Promote from experimental to unstable

Show diffs side-by-side

added added

removed removed

Lines of Context:
 
1
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
 
2
<html xmlns="http://www.w3.org/1999/xhtml">
 
3
<head>
 
4
<meta http-equiv="Content-Type" content="text/xhtml;charset=UTF-8"/>
 
5
<meta http-equiv="X-UA-Compatible" content="IE=9"/>
 
6
<title>tesseract: /usr/local/google/home/jbreiden/tesseract-ocr-read-only/ccmain/osdetect.cpp Source File</title>
 
7
 
 
8
<link href="tabs.css" rel="stylesheet" type="text/css"/>
 
9
<link href="doxygen.css" rel="stylesheet" type="text/css" />
 
10
<link href="navtree.css" rel="stylesheet" type="text/css"/>
 
11
<script type="text/javascript" src="jquery.js"></script>
 
12
<script type="text/javascript" src="resize.js"></script>
 
13
<script type="text/javascript" src="navtree.js"></script>
 
14
<script type="text/javascript">
 
15
  $(document).ready(initResizable);
 
16
</script>
 
17
<link href="search/search.css" rel="stylesheet" type="text/css"/>
 
18
<script type="text/javascript" src="search/search.js"></script>
 
19
<script type="text/javascript">
 
20
  $(document).ready(function() { searchBox.OnSelectItem(0); });
 
21
</script>
 
22
 
 
23
</head>
 
24
<body>
 
25
<div id="top"><!-- do not remove this div! -->
 
26
 
 
27
 
 
28
<div id="titlearea">
 
29
<table cellspacing="0" cellpadding="0">
 
30
 <tbody>
 
31
 <tr style="height: 56px;">
 
32
  
 
33
  
 
34
  <td style="padding-left: 0.5em;">
 
35
   <div id="projectname">tesseract
 
36
   &#160;<span id="projectnumber">3.03</span>
 
37
   </div>
 
38
   
 
39
  </td>
 
40
  
 
41
  
 
42
  
 
43
 </tr>
 
44
 </tbody>
 
45
</table>
 
46
</div>
 
47
 
 
48
<!-- Generated by Doxygen 1.7.6.1 -->
 
49
<script type="text/javascript">
 
50
var searchBox = new SearchBox("searchBox", "search",false,'Search');
 
51
</script>
 
52
  <div id="navrow1" class="tabs">
 
53
    <ul class="tablist">
 
54
      <li><a href="index.html"><span>Main&#160;Page</span></a></li>
 
55
      <li><a href="pages.html"><span>Related&#160;Pages</span></a></li>
 
56
      <li><a href="modules.html"><span>Modules</span></a></li>
 
57
      <li><a href="namespaces.html"><span>Namespaces</span></a></li>
 
58
      <li><a href="annotated.html"><span>Classes</span></a></li>
 
59
      <li class="current"><a href="files.html"><span>Files</span></a></li>
 
60
      <li>
 
61
        <div id="MSearchBox" class="MSearchBoxInactive">
 
62
        <span class="left">
 
63
          <img id="MSearchSelect" src="search/mag_sel.png"
 
64
               onmouseover="return searchBox.OnSearchSelectShow()"
 
65
               onmouseout="return searchBox.OnSearchSelectHide()"
 
66
               alt=""/>
 
67
          <input type="text" id="MSearchField" value="Search" accesskey="S"
 
68
               onfocus="searchBox.OnSearchFieldFocus(true)" 
 
69
               onblur="searchBox.OnSearchFieldFocus(false)" 
 
70
               onkeyup="searchBox.OnSearchFieldChange(event)"/>
 
71
          </span><span class="right">
 
72
            <a id="MSearchClose" href="javascript:searchBox.CloseResultsWindow()"><img id="MSearchCloseImg" border="0" src="search/close.png" alt=""/></a>
 
73
          </span>
 
74
        </div>
 
75
      </li>
 
76
    </ul>
 
77
  </div>
 
78
  <div id="navrow2" class="tabs2">
 
79
    <ul class="tablist">
 
80
      <li><a href="files.html"><span>File&#160;List</span></a></li>
 
81
      <li><a href="globals.html"><span>File&#160;Members</span></a></li>
 
82
    </ul>
 
83
  </div>
 
84
</div>
 
85
<div id="side-nav" class="ui-resizable side-nav-resizable">
 
86
  <div id="nav-tree">
 
87
    <div id="nav-tree-contents">
 
88
    </div>
 
89
  </div>
 
90
  <div id="splitbar" style="-moz-user-select:none;" 
 
91
       class="ui-resizable-handle">
 
92
  </div>
 
93
</div>
 
94
<script type="text/javascript">
 
95
  initNavTree('a00687.html','');
 
96
</script>
 
97
<div id="doc-content">
 
98
<div class="header">
 
99
  <div class="headertitle">
 
100
<div class="title">/usr/local/google/home/jbreiden/tesseract-ocr-read-only/ccmain/osdetect.cpp</div>  </div>
 
101
</div><!--header-->
 
102
<div class="contents">
 
103
<a href="a00687.html">Go to the documentation of this file.</a><div class="fragment"><pre class="fragment"><a name="l00001"></a>00001 
 
104
<a name="l00002"></a>00002 <span class="comment">// File:        osdetect.cpp</span>
 
105
<a name="l00003"></a>00003 <span class="comment">// Description: Orientation and script detection.</span>
 
106
<a name="l00004"></a>00004 <span class="comment">// Author:      Samuel Charron</span>
 
107
<a name="l00005"></a>00005 <span class="comment">//              Ranjith Unnikrishnan</span>
 
108
<a name="l00006"></a>00006 <span class="comment">//</span>
 
109
<a name="l00007"></a>00007 <span class="comment">// (C) Copyright 2008, Google Inc.</span>
 
110
<a name="l00008"></a>00008 <span class="comment">// Licensed under the Apache License, Version 2.0 (the &quot;License&quot;);</span>
 
111
<a name="l00009"></a>00009 <span class="comment">// you may not use this file except in compliance with the License.</span>
 
112
<a name="l00010"></a>00010 <span class="comment">// You may obtain a copy of the License at</span>
 
113
<a name="l00011"></a>00011 <span class="comment">// http://www.apache.org/licenses/LICENSE-2.0</span>
 
114
<a name="l00012"></a>00012 <span class="comment">// Unless required by applicable law or agreed to in writing, software</span>
 
115
<a name="l00013"></a>00013 <span class="comment">// distributed under the License is distributed on an &quot;AS IS&quot; BASIS,</span>
 
116
<a name="l00014"></a>00014 <span class="comment">// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.</span>
 
117
<a name="l00015"></a>00015 <span class="comment">// See the License for the specific language governing permissions and</span>
 
118
<a name="l00016"></a>00016 <span class="comment">// limitations under the License.</span>
 
119
<a name="l00017"></a>00017 <span class="comment">//</span>
 
120
<a name="l00019"></a>00019 <span class="comment"></span>
 
121
<a name="l00020"></a>00020 <span class="preprocessor">#include &quot;<a class="code" href="a00688.html">osdetect.h</a>&quot;</span>
 
122
<a name="l00021"></a>00021 
 
123
<a name="l00022"></a>00022 <span class="preprocessor">#include &quot;<a class="code" href="a00728.html">blobbox.h</a>&quot;</span>
 
124
<a name="l00023"></a>00023 <span class="preprocessor">#include &quot;<a class="code" href="a00732.html">blread.h</a>&quot;</span>
 
125
<a name="l00024"></a>00024 <span class="preprocessor">#include &quot;<a class="code" href="a01099.html">colfind.h</a>&quot;</span>
 
126
<a name="l00025"></a>00025 <span class="preprocessor">#include &quot;<a class="code" href="a00747.html">fontinfo.h</a>&quot;</span>
 
127
<a name="l00026"></a>00026 <span class="preprocessor">#include &quot;<a class="code" href="a01123.html">imagefind.h</a>&quot;</span>
 
128
<a name="l00027"></a>00027 <span class="preprocessor">#include &quot;<a class="code" href="a01125.html">linefind.h</a>&quot;</span>
 
129
<a name="l00028"></a>00028 <span class="preprocessor">#include &quot;<a class="code" href="a01043.html">oldlist.h</a>&quot;</span>
 
130
<a name="l00029"></a>00029 <span class="preprocessor">#include &quot;<a class="code" href="a00846.html">qrsequence.h</a>&quot;</span>
 
131
<a name="l00030"></a>00030 <span class="preprocessor">#include &quot;<a class="code" href="a00788.html">ratngs.h</a>&quot;</span>
 
132
<a name="l00031"></a>00031 <span class="preprocessor">#include &quot;<a class="code" href="a00855.html">strngs.h</a>&quot;</span>
 
133
<a name="l00032"></a>00032 <span class="preprocessor">#include &quot;<a class="code" href="a01147.html">tabvector.h</a>&quot;</span>
 
134
<a name="l00033"></a>00033 <span class="preprocessor">#include &quot;<a class="code" href="a00716.html">tesseractclass.h</a>&quot;</span>
 
135
<a name="l00034"></a>00034 <span class="preprocessor">#include &quot;<a class="code" href="a01151.html">textord.h</a>&quot;</span>
 
136
<a name="l00035"></a>00035 
 
137
<a name="l00036"></a><a class="code" href="a00687.html#a1dcbb4454cb6c97be113fc6ae820c958">00036</a> <span class="keyword">const</span> <span class="keywordtype">int</span> <a class="code" href="a00687.html#a1dcbb4454cb6c97be113fc6ae820c958">kMinCharactersToTry</a> = 50;
 
138
<a name="l00037"></a><a class="code" href="a00687.html#ab1eb3d41a8092b2cc34e2c1d17886521">00037</a> <span class="keyword">const</span> <span class="keywordtype">int</span> <a class="code" href="a00687.html#ab1eb3d41a8092b2cc34e2c1d17886521">kMaxCharactersToTry</a> = 5 * <a class="code" href="a00687.html#a1dcbb4454cb6c97be113fc6ae820c958">kMinCharactersToTry</a>;
 
139
<a name="l00038"></a>00038 
 
140
<a name="l00039"></a><a class="code" href="a00687.html#ac23eec99b25d1c109fb6ee2590a331bf">00039</a> <span class="keyword">const</span> <span class="keywordtype">float</span> <a class="code" href="a00687.html#ac23eec99b25d1c109fb6ee2590a331bf">kSizeRatioToReject</a> = 2.0;
 
141
<a name="l00040"></a><a class="code" href="a00687.html#aaba53b59683a4788881c7b8281f25fac">00040</a> <span class="keyword">const</span> <span class="keywordtype">int</span> <a class="code" href="a00687.html#aaba53b59683a4788881c7b8281f25fac">kMinAcceptableBlobHeight</a> = 10;
 
142
<a name="l00041"></a>00041 
 
143
<a name="l00042"></a><a class="code" href="a00687.html#ad58ecd1e0aa2241ba3ccd5d0398c1e5c">00042</a> <span class="keyword">const</span> <span class="keywordtype">float</span> <a class="code" href="a00687.html#ad58ecd1e0aa2241ba3ccd5d0398c1e5c">kOrientationAcceptRatio</a> = 1.3;
 
144
<a name="l00043"></a><a class="code" href="a00687.html#a448b61b7951bc14ffab3cc00ba37aadd">00043</a> <span class="keyword">const</span> <span class="keywordtype">float</span> <a class="code" href="a00687.html#a448b61b7951bc14ffab3cc00ba37aadd">kScriptAcceptRatio</a> = 1.3;
 
145
<a name="l00044"></a>00044 
 
146
<a name="l00045"></a><a class="code" href="a00687.html#ae3f12edb58f6ed0a11daea2cbf8dc547">00045</a> <span class="keyword">const</span> <span class="keywordtype">float</span> <a class="code" href="a00687.html#ae3f12edb58f6ed0a11daea2cbf8dc547">kHanRatioInKorean</a> = 0.7;
 
147
<a name="l00046"></a><a class="code" href="a00687.html#aab3b7e76eea520b1e4b9d68165e3a094">00046</a> <span class="keyword">const</span> <span class="keywordtype">float</span> <a class="code" href="a00687.html#aab3b7e76eea520b1e4b9d68165e3a094">kHanRatioInJapanese</a> = 0.3;
 
148
<a name="l00047"></a>00047 
 
149
<a name="l00048"></a><a class="code" href="a00687.html#a14c7913eafbd3237afbdd7c6b498b2d8">00048</a> <span class="keyword">const</span> <span class="keywordtype">float</span> <a class="code" href="a00687.html#a14c7913eafbd3237afbdd7c6b498b2d8">kNonAmbiguousMargin</a> = 1.0;
 
150
<a name="l00049"></a>00049 
 
151
<a name="l00050"></a>00050 <span class="comment">// General scripts</span>
 
152
<a name="l00051"></a>00051 <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">char</span>* han_script = <span class="stringliteral">&quot;Han&quot;</span>;
 
153
<a name="l00052"></a>00052 <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">char</span>* latin_script = <span class="stringliteral">&quot;Latin&quot;</span>;
 
154
<a name="l00053"></a>00053 <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">char</span>* katakana_script = <span class="stringliteral">&quot;Katakana&quot;</span>;
 
155
<a name="l00054"></a>00054 <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">char</span>* hiragana_script = <span class="stringliteral">&quot;Hiragana&quot;</span>;
 
156
<a name="l00055"></a>00055 <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">char</span>* hangul_script = <span class="stringliteral">&quot;Hangul&quot;</span>;
 
157
<a name="l00056"></a>00056 
 
158
<a name="l00057"></a>00057 <span class="comment">// Pseudo-scripts Name</span>
 
159
<a name="l00058"></a>00058 <span class="keyword">const</span> <span class="keywordtype">char</span>* ScriptDetector::korean_script_ = <span class="stringliteral">&quot;Korean&quot;</span>;
 
160
<a name="l00059"></a>00059 <span class="keyword">const</span> <span class="keywordtype">char</span>* ScriptDetector::japanese_script_ = <span class="stringliteral">&quot;Japanese&quot;</span>;
 
161
<a name="l00060"></a>00060 <span class="keyword">const</span> <span class="keywordtype">char</span>* ScriptDetector::fraktur_script_ = <span class="stringliteral">&quot;Fraktur&quot;</span>;
 
162
<a name="l00061"></a>00061 
 
163
<a name="l00062"></a>00062 <span class="comment">// Minimum believable resolution.</span>
 
164
<a name="l00063"></a><a class="code" href="a00687.html#af9f4de4278c712c02788092501b587f3">00063</a> <span class="keyword">const</span> <span class="keywordtype">int</span> <a class="code" href="a00687.html#af9f4de4278c712c02788092501b587f3">kMinCredibleResolution</a> = 70;
 
165
<a name="l00064"></a>00064 <span class="comment">// Default resolution used if input is not believable.</span>
 
166
<a name="l00065"></a><a class="code" href="a00687.html#ad3674a322dd444a002052c5b929b1976">00065</a> <span class="keyword">const</span> <span class="keywordtype">int</span> <a class="code" href="a00687.html#ad3674a322dd444a002052c5b929b1976">kDefaultResolution</a> = 300;
 
167
<a name="l00066"></a>00066 
 
168
<a name="l00067"></a><a class="code" href="a00478.html#af7b5cea89a2bdace52ad5825d6d5d4e6">00067</a> <span class="keywordtype">void</span> <a class="code" href="a00478.html#af7b5cea89a2bdace52ad5825d6d5d4e6">OSResults::update_best_orientation</a>() {
 
169
<a name="l00068"></a>00068   <span class="keywordtype">float</span> first = <a class="code" href="a00478.html#a5fe9fa97000f89cd6f4392b55638e882">orientations</a>[0];
 
170
<a name="l00069"></a>00069   <span class="keywordtype">float</span> second = <a class="code" href="a00478.html#a5fe9fa97000f89cd6f4392b55638e882">orientations</a>[1];
 
171
<a name="l00070"></a>00070   <a class="code" href="a00478.html#a25f64011ea65c038c1ef1a6cedd10f1c">best_result</a>.<a class="code" href="a00477.html#a6dfb6826b41a81524ce867b005ba5641">orientation_id</a> = 0;
 
172
<a name="l00071"></a>00071   <span class="keywordflow">if</span> (<a class="code" href="a00478.html#a5fe9fa97000f89cd6f4392b55638e882">orientations</a>[0] &lt; <a class="code" href="a00478.html#a5fe9fa97000f89cd6f4392b55638e882">orientations</a>[1]) {
 
173
<a name="l00072"></a>00072     first = <a class="code" href="a00478.html#a5fe9fa97000f89cd6f4392b55638e882">orientations</a>[1];
 
174
<a name="l00073"></a>00073     second = <a class="code" href="a00478.html#a5fe9fa97000f89cd6f4392b55638e882">orientations</a>[0];
 
175
<a name="l00074"></a>00074     <a class="code" href="a00478.html#a25f64011ea65c038c1ef1a6cedd10f1c">best_result</a>.<a class="code" href="a00477.html#a6dfb6826b41a81524ce867b005ba5641">orientation_id</a> = 1;
 
176
<a name="l00075"></a>00075   }
 
177
<a name="l00076"></a>00076   <span class="keywordflow">for</span> (<span class="keywordtype">int</span> i = 2; i &lt; 4; ++i) {
 
178
<a name="l00077"></a>00077     <span class="keywordflow">if</span> (<a class="code" href="a00478.html#a5fe9fa97000f89cd6f4392b55638e882">orientations</a>[i] &gt; first) {
 
179
<a name="l00078"></a>00078       second = first;
 
180
<a name="l00079"></a>00079       first = <a class="code" href="a00478.html#a5fe9fa97000f89cd6f4392b55638e882">orientations</a>[i];
 
181
<a name="l00080"></a>00080       <a class="code" href="a00478.html#a25f64011ea65c038c1ef1a6cedd10f1c">best_result</a>.<a class="code" href="a00477.html#a6dfb6826b41a81524ce867b005ba5641">orientation_id</a> = i;
 
182
<a name="l00081"></a>00081     } <span class="keywordflow">else</span> <span class="keywordflow">if</span> (<a class="code" href="a00478.html#a5fe9fa97000f89cd6f4392b55638e882">orientations</a>[i] &gt; second) {
 
183
<a name="l00082"></a>00082       second = <a class="code" href="a00478.html#a5fe9fa97000f89cd6f4392b55638e882">orientations</a>[i];
 
184
<a name="l00083"></a>00083     }
 
185
<a name="l00084"></a>00084   }
 
186
<a name="l00085"></a>00085   <span class="comment">// Store difference of top two orientation scores.</span>
 
187
<a name="l00086"></a>00086   <a class="code" href="a00478.html#a25f64011ea65c038c1ef1a6cedd10f1c">best_result</a>.<a class="code" href="a00477.html#a67e009467e4db6c40777548ffdfe464e">oconfidence</a> = first - second;
 
188
<a name="l00087"></a>00087 }
 
189
<a name="l00088"></a>00088 
 
190
<a name="l00089"></a><a class="code" href="a00478.html#aa13f0e8c136d10e0af341f163951ed3d">00089</a> <span class="keywordtype">void</span> <a class="code" href="a00478.html#aa13f0e8c136d10e0af341f163951ed3d">OSResults::set_best_orientation</a>(<span class="keywordtype">int</span> orientation_id) {
 
191
<a name="l00090"></a>00090   <a class="code" href="a00478.html#a25f64011ea65c038c1ef1a6cedd10f1c">best_result</a>.<a class="code" href="a00477.html#a6dfb6826b41a81524ce867b005ba5641">orientation_id</a> = orientation_id;
 
192
<a name="l00091"></a>00091   <a class="code" href="a00478.html#a25f64011ea65c038c1ef1a6cedd10f1c">best_result</a>.<a class="code" href="a00477.html#a67e009467e4db6c40777548ffdfe464e">oconfidence</a> = 0;
 
193
<a name="l00092"></a>00092 }
 
194
<a name="l00093"></a>00093 
 
195
<a name="l00094"></a><a class="code" href="a00478.html#ab796da60cc16d39f464c03fe4047c358">00094</a> <span class="keywordtype">void</span> <a class="code" href="a00478.html#ab796da60cc16d39f464c03fe4047c358">OSResults::update_best_script</a>(<span class="keywordtype">int</span> orientation) {
 
196
<a name="l00095"></a>00095   <span class="comment">// We skip index 0 to ignore the &quot;Common&quot; script.</span>
 
197
<a name="l00096"></a>00096   <span class="keywordtype">float</span> first = <a class="code" href="a00478.html#af612cc25d8432678d5b87a5911544792">scripts_na</a>[orientation][1];
 
198
<a name="l00097"></a>00097   <span class="keywordtype">float</span> second = <a class="code" href="a00478.html#af612cc25d8432678d5b87a5911544792">scripts_na</a>[orientation][2];
 
199
<a name="l00098"></a>00098   <a class="code" href="a00478.html#a25f64011ea65c038c1ef1a6cedd10f1c">best_result</a>.<a class="code" href="a00477.html#a0647ea3dc4a399a472c48ab1eacd31e1">script_id</a> = 1;
 
200
<a name="l00099"></a>00099   <span class="keywordflow">if</span> (<a class="code" href="a00478.html#af612cc25d8432678d5b87a5911544792">scripts_na</a>[orientation][1] &lt; <a class="code" href="a00478.html#af612cc25d8432678d5b87a5911544792">scripts_na</a>[orientation][2]) {
 
201
<a name="l00100"></a>00100     first = <a class="code" href="a00478.html#af612cc25d8432678d5b87a5911544792">scripts_na</a>[orientation][2];
 
202
<a name="l00101"></a>00101     second = <a class="code" href="a00478.html#af612cc25d8432678d5b87a5911544792">scripts_na</a>[orientation][1];
 
203
<a name="l00102"></a>00102     <a class="code" href="a00478.html#a25f64011ea65c038c1ef1a6cedd10f1c">best_result</a>.<a class="code" href="a00477.html#a0647ea3dc4a399a472c48ab1eacd31e1">script_id</a> = 2;
 
204
<a name="l00103"></a>00103   }
 
205
<a name="l00104"></a>00104   <span class="keywordflow">for</span> (<span class="keywordtype">int</span> i = 3; i &lt; <a class="code" href="a00688.html#ab52d878a730b63bcf57d7bb3113882a1">kMaxNumberOfScripts</a>; ++i) {
 
206
<a name="l00105"></a>00105     <span class="keywordflow">if</span> (<a class="code" href="a00478.html#af612cc25d8432678d5b87a5911544792">scripts_na</a>[orientation][i] &gt; first) {
 
207
<a name="l00106"></a>00106       <a class="code" href="a00478.html#a25f64011ea65c038c1ef1a6cedd10f1c">best_result</a>.<a class="code" href="a00477.html#a0647ea3dc4a399a472c48ab1eacd31e1">script_id</a> = i;
 
208
<a name="l00107"></a>00107       second = first;
 
209
<a name="l00108"></a>00108       first = <a class="code" href="a00478.html#af612cc25d8432678d5b87a5911544792">scripts_na</a>[orientation][i];
 
210
<a name="l00109"></a>00109     } <span class="keywordflow">else</span> <span class="keywordflow">if</span> (<a class="code" href="a00478.html#af612cc25d8432678d5b87a5911544792">scripts_na</a>[orientation][i] &gt; second) {
 
211
<a name="l00110"></a>00110       second = <a class="code" href="a00478.html#af612cc25d8432678d5b87a5911544792">scripts_na</a>[orientation][i];
 
212
<a name="l00111"></a>00111     }
 
213
<a name="l00112"></a>00112   }
 
214
<a name="l00113"></a>00113   <a class="code" href="a00478.html#a25f64011ea65c038c1ef1a6cedd10f1c">best_result</a>.<a class="code" href="a00477.html#ae39a2c718b010ed27eb7f820546da6d6">sconfidence</a> =
 
215
<a name="l00114"></a>00114       (first / second - 1.0) / (<a class="code" href="a00687.html#a448b61b7951bc14ffab3cc00ba37aadd">kScriptAcceptRatio</a> - 1.0);
 
216
<a name="l00115"></a>00115 }
 
217
<a name="l00116"></a>00116 
 
218
<a name="l00117"></a><a class="code" href="a00478.html#a9dcb5250ae2466116c33f5d220223296">00117</a> <span class="keywordtype">int</span> <a class="code" href="a00478.html#a9dcb5250ae2466116c33f5d220223296">OSResults::get_best_script</a>(<span class="keywordtype">int</span> orientation_id)<span class="keyword"> const </span>{
 
219
<a name="l00118"></a>00118   <span class="keywordtype">int</span> max_id = -1;
 
220
<a name="l00119"></a>00119   <span class="keywordflow">for</span> (<span class="keywordtype">int</span> j = 0; j &lt; <a class="code" href="a00688.html#ab52d878a730b63bcf57d7bb3113882a1">kMaxNumberOfScripts</a>; ++j) {
 
221
<a name="l00120"></a>00120     <span class="keyword">const</span> <span class="keywordtype">char</span> *script = <a class="code" href="a00478.html#a78ebdae52f3c685095b56790598ad97c">unicharset</a>-&gt;<a class="code" href="a00642.html#a4fc0f6815e2091efedcff7ab6183d19a">get_script_from_script_id</a>(j);
 
222
<a name="l00121"></a>00121     <span class="keywordflow">if</span> (strcmp(script, <span class="stringliteral">&quot;Common&quot;</span>) &amp;&amp; strcmp(script, <span class="stringliteral">&quot;NULL&quot;</span>)) {
 
223
<a name="l00122"></a>00122       <span class="keywordflow">if</span> (max_id == -1 ||
 
224
<a name="l00123"></a>00123           <a class="code" href="a00478.html#af612cc25d8432678d5b87a5911544792">scripts_na</a>[orientation_id][j] &gt; <a class="code" href="a00478.html#af612cc25d8432678d5b87a5911544792">scripts_na</a>[orientation_id][max_id])
 
225
<a name="l00124"></a>00124         max_id = j;
 
226
<a name="l00125"></a>00125     }
 
227
<a name="l00126"></a>00126   }
 
228
<a name="l00127"></a>00127   <span class="keywordflow">return</span> max_id;
 
229
<a name="l00128"></a>00128 }
 
230
<a name="l00129"></a>00129 
 
231
<a name="l00130"></a>00130 <span class="comment">// Print the script scores for all possible orientations.</span>
 
232
<a name="l00131"></a><a class="code" href="a00478.html#a4425aefc39fde345cea1288d95691bed">00131</a> <span class="keywordtype">void</span> <a class="code" href="a00478.html#a4425aefc39fde345cea1288d95691bed">OSResults::print_scores</a>(<span class="keywordtype">void</span>)<span class="keyword"> const </span>{
 
233
<a name="l00132"></a>00132   <span class="keywordflow">for</span> (<span class="keywordtype">int</span> i = 0; i &lt; 4; ++i) {
 
234
<a name="l00133"></a>00133     <a class="code" href="a00860.html#a02aa7cca2c3857c14716e8cca96ace6c">tprintf</a>(<span class="stringliteral">&quot;Orientation id #%d&quot;</span>, i);
 
235
<a name="l00134"></a>00134     <a class="code" href="a00478.html#a4425aefc39fde345cea1288d95691bed">print_scores</a>(i);
 
236
<a name="l00135"></a>00135   }
 
237
<a name="l00136"></a>00136 }
 
238
<a name="l00137"></a>00137 
 
239
<a name="l00138"></a>00138 <span class="comment">// Print the script scores for the given candidate orientation.</span>
 
240
<a name="l00139"></a><a class="code" href="a00478.html#a4c4c5d0fce6889edeea358f755f7e378">00139</a> <span class="keywordtype">void</span> <a class="code" href="a00478.html#a4425aefc39fde345cea1288d95691bed">OSResults::print_scores</a>(<span class="keywordtype">int</span> orientation_id)<span class="keyword"> const </span>{
 
241
<a name="l00140"></a>00140   <span class="keywordflow">for</span> (<span class="keywordtype">int</span> j = 0; j &lt; <a class="code" href="a00688.html#ab52d878a730b63bcf57d7bb3113882a1">kMaxNumberOfScripts</a>; ++j) {
 
242
<a name="l00141"></a>00141     <span class="keywordflow">if</span> (<a class="code" href="a00478.html#af612cc25d8432678d5b87a5911544792">scripts_na</a>[orientation_id][j]) {
 
243
<a name="l00142"></a>00142       <a class="code" href="a00860.html#a02aa7cca2c3857c14716e8cca96ace6c">tprintf</a>(<span class="stringliteral">&quot;%12s\t: %f\n&quot;</span>, <a class="code" href="a00478.html#a78ebdae52f3c685095b56790598ad97c">unicharset</a>-&gt;<a class="code" href="a00642.html#a4fc0f6815e2091efedcff7ab6183d19a">get_script_from_script_id</a>(j),
 
244
<a name="l00143"></a>00143              <a class="code" href="a00478.html#af612cc25d8432678d5b87a5911544792">scripts_na</a>[orientation_id][j]);
 
245
<a name="l00144"></a>00144     }
 
246
<a name="l00145"></a>00145   }
 
247
<a name="l00146"></a>00146 }
 
248
<a name="l00147"></a>00147 
 
249
<a name="l00148"></a>00148 <span class="comment">// Accumulate scores with given OSResults instance and update the best script.</span>
 
250
<a name="l00149"></a><a class="code" href="a00478.html#a25b4edef21699b3a367d7978733595be">00149</a> <span class="keywordtype">void</span> <a class="code" href="a00478.html#a25b4edef21699b3a367d7978733595be">OSResults::accumulate</a>(<span class="keyword">const</span> <a class="code" href="a00478.html">OSResults</a>&amp; osr) {
 
251
<a name="l00150"></a>00150   <span class="keywordflow">for</span> (<span class="keywordtype">int</span> i = 0; i &lt; 4; ++i) {
 
252
<a name="l00151"></a>00151     <a class="code" href="a00478.html#a5fe9fa97000f89cd6f4392b55638e882">orientations</a>[i] += osr.<a class="code" href="a00478.html#a5fe9fa97000f89cd6f4392b55638e882">orientations</a>[i];
 
253
<a name="l00152"></a>00152     <span class="keywordflow">for</span> (<span class="keywordtype">int</span> j = 0; j &lt; <a class="code" href="a00688.html#ab52d878a730b63bcf57d7bb3113882a1">kMaxNumberOfScripts</a>; ++j)
 
254
<a name="l00153"></a>00153       <a class="code" href="a00478.html#af612cc25d8432678d5b87a5911544792">scripts_na</a>[i][j] += osr.<a class="code" href="a00478.html#af612cc25d8432678d5b87a5911544792">scripts_na</a>[i][j];
 
255
<a name="l00154"></a>00154   }
 
256
<a name="l00155"></a>00155   <a class="code" href="a00478.html#a78ebdae52f3c685095b56790598ad97c">unicharset</a> = osr.<a class="code" href="a00478.html#a78ebdae52f3c685095b56790598ad97c">unicharset</a>;
 
257
<a name="l00156"></a>00156   <a class="code" href="a00478.html#af7b5cea89a2bdace52ad5825d6d5d4e6">update_best_orientation</a>();
 
258
<a name="l00157"></a>00157   <a class="code" href="a00478.html#ab796da60cc16d39f464c03fe4047c358">update_best_script</a>(<a class="code" href="a00478.html#a25f64011ea65c038c1ef1a6cedd10f1c">best_result</a>.<a class="code" href="a00477.html#a6dfb6826b41a81524ce867b005ba5641">orientation_id</a>);
 
259
<a name="l00158"></a>00158 }
 
260
<a name="l00159"></a>00159 
 
261
<a name="l00160"></a>00160 <span class="comment">// Detect and erase horizontal/vertical lines and picture regions from the</span>
 
262
<a name="l00161"></a>00161 <span class="comment">// image, so that non-text blobs are removed from consideration.</span>
 
263
<a name="l00162"></a><a class="code" href="a00687.html#a0328b8314a9022034d90c11ac8a0b0ea">00162</a> <span class="keywordtype">void</span> <a class="code" href="a00687.html#a0328b8314a9022034d90c11ac8a0b0ea">remove_nontext_regions</a>(<a class="code" href="a00607.html">tesseract::Tesseract</a> *tess, BLOCK_LIST *blocks,
 
264
<a name="l00163"></a>00163                             TO_BLOCK_LIST *to_blocks) {
 
265
<a name="l00164"></a>00164   Pix *pix = tess-&gt;<a class="code" href="a00607.html#a97fde2a457aa76137737b247a2418cb7">pix_binary</a>();
 
266
<a name="l00165"></a>00165   <a class="code" href="a00823.html#a93a603f4063a6b9403d81caa245a583b">ASSERT_HOST</a>(pix != NULL);
 
267
<a name="l00166"></a>00166   <span class="keywordtype">int</span> vertical_x = 0;
 
268
<a name="l00167"></a>00167   <span class="keywordtype">int</span> vertical_y = 1;
 
269
<a name="l00168"></a>00168   tesseract::TabVector_LIST v_lines;
 
270
<a name="l00169"></a>00169   tesseract::TabVector_LIST h_lines;
 
271
<a name="l00170"></a>00170   <span class="keyword">const</span> <span class="keywordtype">int</span> <a class="code" href="a00687.html#af9f4de4278c712c02788092501b587f3">kMinCredibleResolution</a> = 70;
 
272
<a name="l00171"></a>00171   <span class="keywordtype">int</span> resolution = (kMinCredibleResolution &gt; pixGetXRes(pix)) ?
 
273
<a name="l00172"></a>00172       kMinCredibleResolution : pixGetXRes(pix);
 
274
<a name="l00173"></a>00173 
 
275
<a name="l00174"></a>00174   <a class="code" href="a00451.html#a3a72521c00cb7725b2282b7b3cc6e6b9">tesseract::LineFinder::FindAndRemoveLines</a>(resolution, <span class="keyword">false</span>, pix,
 
276
<a name="l00175"></a>00175                                             &amp;vertical_x, &amp;vertical_y,
 
277
<a name="l00176"></a>00176                                             NULL, &amp;v_lines, &amp;h_lines);
 
278
<a name="l00177"></a>00177   Pix* im_pix = <a class="code" href="a00413.html#af465be1a567090dcaaa74eb7742c51fe">tesseract::ImageFind::FindImages</a>(pix);
 
279
<a name="l00178"></a>00178   <span class="keywordflow">if</span> (im_pix != NULL) {
 
280
<a name="l00179"></a>00179     pixSubtract(pix, pix, im_pix);
 
281
<a name="l00180"></a>00180     pixDestroy(&amp;im_pix);
 
282
<a name="l00181"></a>00181   }
 
283
<a name="l00182"></a>00182   tess-&gt;<a class="code" href="a00607.html#a6fa77152d6fd5c6afe14f2698413d0f9">mutable_textord</a>()-&gt;<a class="code" href="a00625.html#ab478029b49bf4efadd59a547565327a7">find_components</a>(tess-&gt;<a class="code" href="a00607.html#a97fde2a457aa76137737b247a2418cb7">pix_binary</a>(),
 
284
<a name="l00183"></a>00183                                            blocks, to_blocks);
 
285
<a name="l00184"></a>00184 }
 
286
<a name="l00185"></a>00185 
 
287
<a name="l00186"></a>00186 <span class="comment">// Find connected components in the page and process a subset until finished or</span>
 
288
<a name="l00187"></a>00187 <span class="comment">// a stopping criterion is met.</span>
 
289
<a name="l00188"></a>00188 <span class="comment">// Returns the number of blobs used in making the estimate. 0 implies failure.</span>
 
290
<a name="l00189"></a><a class="code" href="a00688.html#af7ea57b0e1847f524c98576cb5cace43">00189</a> <span class="keywordtype">int</span> <a class="code" href="a00687.html#aec0e2284de8927ea9f29b61ff30d052a">orientation_and_script_detection</a>(<a class="code" href="a00557.html">STRING</a>&amp; <a class="code" href="a01266.html#a61c02c0afc996e6b9c619f0a757af50b">filename</a>,
 
291
<a name="l00190"></a>00190                                      <a class="code" href="a00478.html">OSResults</a>* osr,
 
292
<a name="l00191"></a>00191                                      <a class="code" href="a00607.html">tesseract::Tesseract</a>* tess) {
 
293
<a name="l00192"></a>00192   <a class="code" href="a00557.html">STRING</a> name = <a class="code" href="a01266.html#a61c02c0afc996e6b9c619f0a757af50b">filename</a>;        <span class="comment">//truncated name</span>
 
294
<a name="l00193"></a>00193   <span class="keyword">const</span> <span class="keywordtype">char</span> *lastdot;           <span class="comment">//of name</span>
 
295
<a name="l00194"></a>00194   <a class="code" href="a00592.html">TBOX</a> page_box;
 
296
<a name="l00195"></a>00195 
 
297
<a name="l00196"></a>00196   lastdot = strrchr (name.<a class="code" href="a00557.html#a32beee43ecab1bed8bebc3466896ad6e">string</a> (), <span class="charliteral">&#39;.&#39;</span>);
 
298
<a name="l00197"></a>00197   <span class="keywordflow">if</span> (lastdot != NULL)
 
299
<a name="l00198"></a>00198     name[lastdot-name.<a class="code" href="a00557.html#a32beee43ecab1bed8bebc3466896ad6e">string</a>()] = <span class="charliteral">&#39;\0&#39;</span>;
 
300
<a name="l00199"></a>00199 
 
301
<a name="l00200"></a>00200   <a class="code" href="a00823.html#a93a603f4063a6b9403d81caa245a583b">ASSERT_HOST</a>(tess-&gt;<a class="code" href="a00607.html#a97fde2a457aa76137737b247a2418cb7">pix_binary</a>() != NULL)
 
302
<a name="l00201"></a>00201   <span class="keywordtype">int</span> width = pixGetWidth(tess-&gt;<a class="code" href="a00607.html#a97fde2a457aa76137737b247a2418cb7">pix_binary</a>());
 
303
<a name="l00202"></a>00202   <span class="keywordtype">int</span> height = pixGetHeight(tess-&gt;<a class="code" href="a00607.html#a97fde2a457aa76137737b247a2418cb7">pix_binary</a>());
 
304
<a name="l00203"></a>00203   <span class="keywordtype">int</span> resolution = pixGetXRes(tess-&gt;<a class="code" href="a00607.html#a97fde2a457aa76137737b247a2418cb7">pix_binary</a>());
 
305
<a name="l00204"></a>00204   <span class="comment">// Zero resolution messes up the algorithms, so make sure it is credible.</span>
 
306
<a name="l00205"></a>00205   <span class="keywordflow">if</span> (resolution &lt; <a class="code" href="a00687.html#af9f4de4278c712c02788092501b587f3">kMinCredibleResolution</a>)
 
307
<a name="l00206"></a>00206     resolution = <a class="code" href="a00687.html#ad3674a322dd444a002052c5b929b1976">kDefaultResolution</a>;
 
308
<a name="l00207"></a>00207 
 
309
<a name="l00208"></a>00208   BLOCK_LIST blocks;
 
310
<a name="l00209"></a>00209   <span class="keywordflow">if</span> (!<a class="code" href="a00731.html#ab65373023a95c3043ea26b7906e29907">read_unlv_file</a>(name, width, height, &amp;blocks))
 
311
<a name="l00210"></a>00210     <a class="code" href="a00731.html#a6d4d883ff45201c5b6166b5941cb96a2">FullPageBlock</a>(width, height, &amp;blocks);
 
312
<a name="l00211"></a>00211 
 
313
<a name="l00212"></a>00212   <span class="comment">// Try to remove non-text regions from consideration.</span>
 
314
<a name="l00213"></a>00213   TO_BLOCK_LIST land_blocks, port_blocks;
 
315
<a name="l00214"></a>00214   <a class="code" href="a00687.html#a0328b8314a9022034d90c11ac8a0b0ea">remove_nontext_regions</a>(tess, &amp;blocks, &amp;port_blocks);
 
316
<a name="l00215"></a>00215 
 
317
<a name="l00216"></a>00216   <span class="keywordflow">if</span> (port_blocks.empty()) {
 
318
<a name="l00217"></a>00217     <span class="comment">// page segmentation did not succeed, so we need to find_components first.</span>
 
319
<a name="l00218"></a>00218     tess-&gt;<a class="code" href="a00607.html#a6fa77152d6fd5c6afe14f2698413d0f9">mutable_textord</a>()-&gt;<a class="code" href="a00625.html#ab478029b49bf4efadd59a547565327a7">find_components</a>(tess-&gt;<a class="code" href="a00607.html#a97fde2a457aa76137737b247a2418cb7">pix_binary</a>(),
 
320
<a name="l00219"></a>00219                                              &amp;blocks, &amp;port_blocks);
 
321
<a name="l00220"></a>00220   } <span class="keywordflow">else</span> {
 
322
<a name="l00221"></a>00221     page_box.<a class="code" href="a00592.html#ae6151cd794841e100d8a346a0c4a46e6">set_left</a>(0);
 
323
<a name="l00222"></a>00222     page_box.<a class="code" href="a00592.html#a6f803b24b046883cb0f3882dc3d92302">set_bottom</a>(0);
 
324
<a name="l00223"></a>00223     page_box.<a class="code" href="a00592.html#a2246293d3667b28c52a52353a2d5caea">set_right</a>(width);
 
325
<a name="l00224"></a>00224     page_box.<a class="code" href="a00592.html#a7f40dfd290a907200bdc98c196f63f45">set_top</a>(height);
 
326
<a name="l00225"></a>00225     <span class="comment">// Filter_blobs sets up the TO_BLOCKs the same as find_components does.</span>
 
327
<a name="l00226"></a>00226     tess-&gt;<a class="code" href="a00607.html#a6fa77152d6fd5c6afe14f2698413d0f9">mutable_textord</a>()-&gt;<a class="code" href="a00625.html#acaed60ac5b5ef00751e3d307347aa0e9">filter_blobs</a>(page_box.<a class="code" href="a00592.html#a02511fc69b598b332ac1f4af6c943f8f">topright</a>(),
 
328
<a name="l00227"></a>00227                                           &amp;port_blocks, <span class="keyword">true</span>);
 
329
<a name="l00228"></a>00228   }
 
330
<a name="l00229"></a>00229 
 
331
<a name="l00230"></a>00230   <span class="keywordflow">return</span> <a class="code" href="a00687.html#a93fedb9cccbbcf81d3433b95bbc46bdd">os_detect</a>(&amp;port_blocks, osr, tess);
 
332
<a name="l00231"></a>00231 }
 
333
<a name="l00232"></a>00232 
 
334
<a name="l00233"></a>00233 <span class="comment">// Filter and sample the blobs.</span>
 
335
<a name="l00234"></a>00234 <span class="comment">// Returns a non-zero number of blobs if the page was successfully processed, or</span>
 
336
<a name="l00235"></a>00235 <span class="comment">// zero if the page had too few characters to be reliable</span>
 
337
<a name="l00236"></a><a class="code" href="a00688.html#a93fedb9cccbbcf81d3433b95bbc46bdd">00236</a> <span class="keywordtype">int</span> <a class="code" href="a00687.html#a93fedb9cccbbcf81d3433b95bbc46bdd">os_detect</a>(TO_BLOCK_LIST* port_blocks, <a class="code" href="a00478.html">OSResults</a>* osr,
 
338
<a name="l00237"></a>00237               <a class="code" href="a00607.html">tesseract::Tesseract</a>* tess) {
 
339
<a name="l00238"></a>00238   <span class="keywordtype">int</span> blobs_total = 0;
 
340
<a name="l00239"></a>00239   TO_BLOCK_IT block_it;
 
341
<a name="l00240"></a>00240   block_it.set_to_list(port_blocks);
 
342
<a name="l00241"></a>00241 
 
343
<a name="l00242"></a>00242   BLOBNBOX_CLIST filtered_list;
 
344
<a name="l00243"></a>00243   BLOBNBOX_C_IT filtered_it(&amp;filtered_list);
 
345
<a name="l00244"></a>00244 
 
346
<a name="l00245"></a>00245   <span class="keywordflow">for</span> (block_it.mark_cycle_pt(); !block_it.cycled_list();
 
347
<a name="l00246"></a>00246        block_it.forward ()) {
 
348
<a name="l00247"></a>00247     <a class="code" href="a00627.html">TO_BLOCK</a>* to_block = block_it.data();
 
349
<a name="l00248"></a>00248     <span class="keywordflow">if</span> (to_block-&gt;<a class="code" href="a00627.html#a16e698664028b0d6d2193db64560c16b">block</a>-&gt;<a class="code" href="a00500.html#a6670779c69aca2d574e4a0590d9b3939">poly_block</a>() &amp;&amp;
 
350
<a name="l00249"></a>00249         !to_block-&gt;<a class="code" href="a00627.html#a16e698664028b0d6d2193db64560c16b">block</a>-&gt;<a class="code" href="a00500.html#a6670779c69aca2d574e4a0590d9b3939">poly_block</a>()-&gt;<a class="code" href="a00505.html#abd32dee532afe634cdbacffc0b53e660">IsText</a>()) <span class="keywordflow">continue</span>;
 
351
<a name="l00250"></a>00250     BLOBNBOX_IT bbox_it;
 
352
<a name="l00251"></a>00251     bbox_it.set_to_list(&amp;to_block-&gt;<a class="code" href="a00627.html#a5dd67c54162a6b60b0fd11500d4a3025">blobs</a>);
 
353
<a name="l00252"></a>00252     <span class="keywordflow">for</span> (bbox_it.mark_cycle_pt (); !bbox_it.cycled_list ();
 
354
<a name="l00253"></a>00253          bbox_it.forward ()) {
 
355
<a name="l00254"></a>00254       <a class="code" href="a00279.html">BLOBNBOX</a>* bbox = bbox_it.data();
 
356
<a name="l00255"></a>00255       <a class="code" href="a00289.html">C_BLOB</a>*   blob = bbox-&gt;<a class="code" href="a00279.html#a483f44541a4dd818f02225c92f030e07">cblob</a>();
 
357
<a name="l00256"></a>00256       <a class="code" href="a00592.html">TBOX</a>      box = blob-&gt;<a class="code" href="a00289.html#a77e52e29e2c622a3a63bb7edb110f6ab">bounding_box</a>();
 
358
<a name="l00257"></a>00257       ++blobs_total;
 
359
<a name="l00258"></a>00258 
 
360
<a name="l00259"></a>00259       <span class="keywordtype">float</span> y_x = fabs((box.<a class="code" href="a00592.html#a8379d4bbc72bdbb1f069fc14790e632d">height</a>() * 1.0) / box.<a class="code" href="a00592.html#af95494a2ccacc70cc2b83820b2948619">width</a>());
 
361
<a name="l00260"></a>00260       <span class="keywordtype">float</span> x_y = 1.0f / y_x;
 
362
<a name="l00261"></a>00261       <span class="comment">// Select a &gt;= 1.0 ratio</span>
 
363
<a name="l00262"></a>00262       <span class="keywordtype">float</span> ratio = x_y &gt; y_x ? x_y : y_x;
 
364
<a name="l00263"></a>00263       <span class="comment">// Blob is ambiguous</span>
 
365
<a name="l00264"></a>00264       <span class="keywordflow">if</span> (ratio &gt; <a class="code" href="a00687.html#ac23eec99b25d1c109fb6ee2590a331bf">kSizeRatioToReject</a>) <span class="keywordflow">continue</span>;
 
366
<a name="l00265"></a>00265       <span class="keywordflow">if</span> (box.<a class="code" href="a00592.html#a8379d4bbc72bdbb1f069fc14790e632d">height</a>() &lt; <a class="code" href="a00687.html#aaba53b59683a4788881c7b8281f25fac">kMinAcceptableBlobHeight</a>) <span class="keywordflow">continue</span>;
 
367
<a name="l00266"></a>00266       filtered_it.add_to_end(bbox);
 
368
<a name="l00267"></a>00267     }
 
369
<a name="l00268"></a>00268   }
 
370
<a name="l00269"></a>00269   <span class="keywordflow">return</span> <a class="code" href="a00687.html#a1007e747656418b79d4ce9f8f14f2a7b">os_detect_blobs</a>(&amp;filtered_list, osr, tess);
 
371
<a name="l00270"></a>00270 }
 
372
<a name="l00271"></a>00271 
 
373
<a name="l00272"></a>00272 <span class="comment">// Detect orientation and script from a list of blobs.</span>
 
374
<a name="l00273"></a>00273 <span class="comment">// Returns a non-zero number of blobs if the list was successfully processed, or</span>
 
375
<a name="l00274"></a>00274 <span class="comment">// zero if the list had too few characters to be reliable</span>
 
376
<a name="l00275"></a><a class="code" href="a00688.html#a1007e747656418b79d4ce9f8f14f2a7b">00275</a> <span class="keywordtype">int</span> <a class="code" href="a00687.html#a1007e747656418b79d4ce9f8f14f2a7b">os_detect_blobs</a>(BLOBNBOX_CLIST* blob_list, <a class="code" href="a00478.html">OSResults</a>* osr,
 
377
<a name="l00276"></a>00276                     <a class="code" href="a00607.html">tesseract::Tesseract</a>* tess) {
 
378
<a name="l00277"></a>00277   <a class="code" href="a00478.html">OSResults</a> osr_;
 
379
<a name="l00278"></a>00278   <span class="keywordflow">if</span> (osr == NULL)
 
380
<a name="l00279"></a>00279     osr = &amp;osr_;
 
381
<a name="l00280"></a>00280 
 
382
<a name="l00281"></a>00281   osr-&gt;<a class="code" href="a00478.html#a78ebdae52f3c685095b56790598ad97c">unicharset</a> = &amp;tess-&gt;<a class="code" href="a00295.html#a69c5179ac5f10a24f3f97e16ca09460f">unicharset</a>;
 
383
<a name="l00282"></a>00282   <a class="code" href="a00476.html">OrientationDetector</a> o(osr);
 
384
<a name="l00283"></a>00283   <a class="code" href="a00530.html">ScriptDetector</a> s(osr, tess);
 
385
<a name="l00284"></a>00284 
 
386
<a name="l00285"></a>00285   BLOBNBOX_C_IT filtered_it(blob_list);
 
387
<a name="l00286"></a>00286   <span class="keywordtype">int</span> real_max = MIN(filtered_it.length(), <a class="code" href="a00687.html#ab1eb3d41a8092b2cc34e2c1d17886521">kMaxCharactersToTry</a>);
 
388
<a name="l00287"></a>00287   <span class="comment">// tprintf(&quot;Total blobs found = %d\n&quot;, blobs_total);</span>
 
389
<a name="l00288"></a>00288   <span class="comment">// tprintf(&quot;Number of blobs post-filtering = %d\n&quot;, filtered_it.length());</span>
 
390
<a name="l00289"></a>00289   <span class="comment">// tprintf(&quot;Number of blobs to try = %d\n&quot;, real_max);</span>
 
391
<a name="l00290"></a>00290 
 
392
<a name="l00291"></a>00291   <span class="comment">// If there are too few characters, skip this page entirely.</span>
 
393
<a name="l00292"></a>00292   <span class="keywordflow">if</span> (real_max &lt; <a class="code" href="a00687.html#a1dcbb4454cb6c97be113fc6ae820c958">kMinCharactersToTry</a> / 2) {
 
394
<a name="l00293"></a>00293     <a class="code" href="a00860.html#a02aa7cca2c3857c14716e8cca96ace6c">tprintf</a>(<span class="stringliteral">&quot;Too few characters. Skipping this page\n&quot;</span>);
 
395
<a name="l00294"></a>00294     <span class="keywordflow">return</span> 0;
 
396
<a name="l00295"></a>00295   }
 
397
<a name="l00296"></a>00296 
 
398
<a name="l00297"></a>00297   <a class="code" href="a00279.html">BLOBNBOX</a>** blobs = <span class="keyword">new</span> <a class="code" href="a00279.html">BLOBNBOX</a>*[filtered_it.length()];
 
399
<a name="l00298"></a>00298   <span class="keywordtype">int</span> number_of_blobs = 0;
 
400
<a name="l00299"></a>00299   <span class="keywordflow">for</span> (filtered_it.mark_cycle_pt (); !filtered_it.cycled_list ();
 
401
<a name="l00300"></a>00300        filtered_it.forward ()) {
 
402
<a name="l00301"></a>00301     blobs[number_of_blobs++] = (<a class="code" href="a00279.html">BLOBNBOX</a>*)filtered_it.data();
 
403
<a name="l00302"></a>00302   }
 
404
<a name="l00303"></a>00303   <a class="code" href="a00512.html">QRSequenceGenerator</a> sequence(number_of_blobs);
 
405
<a name="l00304"></a>00304   <span class="keywordtype">int</span> num_blobs_evaluated = 0;
 
406
<a name="l00305"></a>00305   <span class="keywordflow">for</span> (<span class="keywordtype">int</span> i = 0; i &lt; real_max; ++i) {
 
407
<a name="l00306"></a>00306     <span class="keywordflow">if</span> (<a class="code" href="a00687.html#a35fb2b0177ed2a774307373aeb7b13d1">os_detect_blob</a>(blobs[sequence.<a class="code" href="a00512.html#a28c125707aded762182e647e0ec91900">GetVal</a>()], &amp;o, &amp;s, osr, tess)
 
408
<a name="l00307"></a>00307         &amp;&amp; i &gt; <a class="code" href="a00687.html#a1dcbb4454cb6c97be113fc6ae820c958">kMinCharactersToTry</a>) {
 
409
<a name="l00308"></a>00308       <span class="keywordflow">break</span>;
 
410
<a name="l00309"></a>00309     }
 
411
<a name="l00310"></a>00310     ++num_blobs_evaluated;
 
412
<a name="l00311"></a>00311   }
 
413
<a name="l00312"></a>00312   <span class="keyword">delete</span> [] blobs;
 
414
<a name="l00313"></a>00313 
 
415
<a name="l00314"></a>00314   <span class="comment">// Make sure the best_result is up-to-date</span>
 
416
<a name="l00315"></a>00315   <span class="keywordtype">int</span> orientation = o.<a class="code" href="a00476.html#a382b5269675f9db848485be62f35742e">get_orientation</a>();
 
417
<a name="l00316"></a>00316   osr-&gt;<a class="code" href="a00478.html#ab796da60cc16d39f464c03fe4047c358">update_best_script</a>(orientation);
 
418
<a name="l00317"></a>00317   <span class="keywordflow">return</span> num_blobs_evaluated;
 
419
<a name="l00318"></a>00318 }
 
420
<a name="l00319"></a>00319 
 
421
<a name="l00320"></a>00320 <span class="comment">// Processes a single blob to estimate script and orientation.</span>
 
422
<a name="l00321"></a>00321 <span class="comment">// Return true if estimate of orientation and script satisfies stopping</span>
 
423
<a name="l00322"></a>00322 <span class="comment">// criteria.</span>
 
424
<a name="l00323"></a><a class="code" href="a00688.html#acd67dc649eafb2a0048434366730af2e">00323</a> <span class="keywordtype">bool</span> <a class="code" href="a00687.html#a35fb2b0177ed2a774307373aeb7b13d1">os_detect_blob</a>(<a class="code" href="a00279.html">BLOBNBOX</a>* bbox, <a class="code" href="a00476.html">OrientationDetector</a>* o,
 
425
<a name="l00324"></a>00324                     <a class="code" href="a00530.html">ScriptDetector</a>* s, <a class="code" href="a00478.html">OSResults</a>* osr,
 
426
<a name="l00325"></a>00325                     <a class="code" href="a00607.html">tesseract::Tesseract</a>* tess) {
 
427
<a name="l00326"></a>00326   tess-&gt;<a class="code" href="a00314.html#a746dbbd1c99e99f3d213077cceedf80e">tess_cn_matching</a>.set_value(<span class="keyword">true</span>); <span class="comment">// turn it on</span>
 
428
<a name="l00327"></a>00327   tess-&gt;<a class="code" href="a00314.html#a85fcc9966cddbc38adf1014dd0cd778c">tess_bn_matching</a>.set_value(<span class="keyword">false</span>);
 
429
<a name="l00328"></a>00328   <a class="code" href="a00289.html">C_BLOB</a>* blob = bbox-&gt;<a class="code" href="a00279.html#a483f44541a4dd818f02225c92f030e07">cblob</a>();
 
430
<a name="l00329"></a>00329   <a class="code" href="a00591.html">TBLOB</a>* tblob = <a class="code" href="a00591.html#a7b6051e1c1934265a91e1ee864bd5164">TBLOB::PolygonalCopy</a>(tess-&gt;<a class="code" href="a00607.html#ae1206c0c4b63a008cc01650004fb7b03">poly_allow_detailed_fx</a>, blob);
 
431
<a name="l00330"></a>00330   <a class="code" href="a00592.html">TBOX</a> box = tblob-&gt;<a class="code" href="a00591.html#a8f1f8f110170fe12cf8147d504cd0ea2">bounding_box</a>();
 
432
<a name="l00331"></a>00331   <a class="code" href="a00375.html">FCOORD</a> current_rotation(1.0f, 0.0f);
 
433
<a name="l00332"></a>00332   <a class="code" href="a00375.html">FCOORD</a> rotation90(0.0f, 1.0f);
 
434
<a name="l00333"></a>00333   BLOB_CHOICE_LIST ratings[4];
 
435
<a name="l00334"></a>00334   <span class="comment">// Test the 4 orientations</span>
 
436
<a name="l00335"></a>00335   <span class="keywordflow">for</span> (<span class="keywordtype">int</span> i = 0; i &lt; 4; ++i) {
 
437
<a name="l00336"></a>00336     <span class="comment">// Normalize the blob. Set the origin to the place we want to be the</span>
 
438
<a name="l00337"></a>00337     <span class="comment">// bottom-middle after rotation.</span>
 
439
<a name="l00338"></a>00338     <span class="comment">// Scaling is to make the rotated height the x-height.</span>
 
440
<a name="l00339"></a>00339     <span class="keywordtype">float</span> scaling = <span class="keyword">static_cast&lt;</span><span class="keywordtype">float</span><span class="keyword">&gt;</span>(<a class="code" href="a00759.html#af974e6755e636c8bc7cbe57e3bcbdd73">kBlnXHeight</a>) / box.<a class="code" href="a00592.html#a8379d4bbc72bdbb1f069fc14790e632d">height</a>();
 
441
<a name="l00340"></a>00340     <span class="keywordtype">float</span> x_origin = (box.<a class="code" href="a00592.html#a724fabf566586b663577dfa944ffbc61">left</a>() + box.<a class="code" href="a00592.html#a8703081c1a1c26db3a4dddaca1028e34">right</a>()) / 2.0f;
 
442
<a name="l00341"></a>00341     <span class="keywordtype">float</span> y_origin = (box.<a class="code" href="a00592.html#a4451d237f1cd18c4982d63fe36a11fc3">bottom</a>() + box.<a class="code" href="a00592.html#adf92e9fdac1bdf11c10d1c4d1178791a">top</a>()) / 2.0f;
 
443
<a name="l00342"></a>00342     <span class="keywordflow">if</span> (i == 0 || i == 2) {
 
444
<a name="l00343"></a>00343       <span class="comment">// Rotation is 0 or 180.</span>
 
445
<a name="l00344"></a>00344       y_origin = i == 0 ? box.<a class="code" href="a00592.html#a4451d237f1cd18c4982d63fe36a11fc3">bottom</a>() : box.<a class="code" href="a00592.html#adf92e9fdac1bdf11c10d1c4d1178791a">top</a>();
 
446
<a name="l00345"></a>00345     } <span class="keywordflow">else</span> {
 
447
<a name="l00346"></a>00346       <span class="comment">// Rotation is 90 or 270.</span>
 
448
<a name="l00347"></a>00347       scaling = <span class="keyword">static_cast&lt;</span><span class="keywordtype">float</span><span class="keyword">&gt;</span>(<a class="code" href="a00759.html#af974e6755e636c8bc7cbe57e3bcbdd73">kBlnXHeight</a>) / box.<a class="code" href="a00592.html#af95494a2ccacc70cc2b83820b2948619">width</a>();
 
449
<a name="l00348"></a>00348       x_origin = i == 1 ? box.<a class="code" href="a00592.html#a724fabf566586b663577dfa944ffbc61">left</a>() : box.<a class="code" href="a00592.html#a8703081c1a1c26db3a4dddaca1028e34">right</a>();
 
450
<a name="l00349"></a>00349     }
 
451
<a name="l00350"></a>00350     <a class="code" href="a00591.html">TBLOB</a>* rotated_blob = <span class="keyword">new</span> <a class="code" href="a00591.html">TBLOB</a>(*tblob);
 
452
<a name="l00351"></a>00351     rotated_blob-&gt;<a class="code" href="a00591.html#a6aef0201c756ed33e68a94abc8ac2b8e">Normalize</a>(NULL, &amp;current_rotation, NULL,
 
453
<a name="l00352"></a>00352                             x_origin, y_origin, scaling, scaling,
 
454
<a name="l00353"></a>00353                             0.0f, static_cast&lt;float&gt;(<a class="code" href="a00759.html#abe10ce41bf7240ae8a053dea471d6ed5">kBlnBaselineOffset</a>),
 
455
<a name="l00354"></a>00354                             <span class="keyword">false</span>, NULL);
 
456
<a name="l00355"></a>00355     tess-&gt;<a class="code" href="a00314.html#ab39a42222f621c9a5f1bd1b31db3a930">AdaptiveClassifier</a>(rotated_blob, ratings + i);
 
457
<a name="l00356"></a>00356     <span class="keyword">delete</span> rotated_blob;
 
458
<a name="l00357"></a>00357     current_rotation.<a class="code" href="a00375.html#a81ca9ea0cac4cd8c1bca0314e29bb28d">rotate</a>(rotation90);
 
459
<a name="l00358"></a>00358   }
 
460
<a name="l00359"></a>00359   <span class="keyword">delete</span> tblob;
 
461
<a name="l00360"></a>00360 
 
462
<a name="l00361"></a>00361   <span class="keywordtype">bool</span> stop = o-&gt;<a class="code" href="a00476.html#a7f3ad682712b5ff3bfcecca0a8a5b086">detect_blob</a>(ratings);
 
463
<a name="l00362"></a>00362   s-&gt;<a class="code" href="a00530.html#aa1626a91138960515d479a781a6b97ca">detect_blob</a>(ratings);
 
464
<a name="l00363"></a>00363   <span class="keywordtype">int</span> orientation = o-&gt;<a class="code" href="a00476.html#a382b5269675f9db848485be62f35742e">get_orientation</a>();
 
465
<a name="l00364"></a>00364   stop = s-&gt;<a class="code" href="a00530.html#a951bd4d3f5b14ee234d20afc91d44585">must_stop</a>(orientation) &amp;&amp; stop;
 
466
<a name="l00365"></a>00365   <span class="keywordflow">return</span> stop;
 
467
<a name="l00366"></a>00366 }
 
468
<a name="l00367"></a>00367 
 
469
<a name="l00368"></a>00368 
 
470
<a name="l00369"></a><a class="code" href="a00476.html#aa00a93a069267a2636ec74f4ebb11095">00369</a> <a class="code" href="a00476.html#aa00a93a069267a2636ec74f4ebb11095">OrientationDetector::OrientationDetector</a>(<a class="code" href="a00478.html">OSResults</a>* osr) {
 
471
<a name="l00370"></a>00370   osr_ = osr;
 
472
<a name="l00371"></a>00371 }
 
473
<a name="l00372"></a>00372 
 
474
<a name="l00373"></a>00373 <span class="comment">// Score the given blob and return true if it is now sure of the orientation</span>
 
475
<a name="l00374"></a>00374 <span class="comment">// after adding this blob.</span>
 
476
<a name="l00375"></a><a class="code" href="a00476.html#a7f3ad682712b5ff3bfcecca0a8a5b086">00375</a> <span class="keywordtype">bool</span> <a class="code" href="a00476.html#a7f3ad682712b5ff3bfcecca0a8a5b086">OrientationDetector::detect_blob</a>(BLOB_CHOICE_LIST* scores) {
 
477
<a name="l00376"></a>00376   <span class="keywordtype">float</span> blob_o_score[4] = {0.0, 0.0, 0.0, 0.0};
 
478
<a name="l00377"></a>00377   <span class="keywordtype">float</span> total_blob_o_score = 0.0;
 
479
<a name="l00378"></a>00378 
 
480
<a name="l00379"></a>00379   <span class="keywordflow">for</span> (<span class="keywordtype">int</span> i = 0; i &lt; 4; ++i) {
 
481
<a name="l00380"></a>00380     BLOB_CHOICE_IT choice_it;
 
482
<a name="l00381"></a>00381     choice_it.set_to_list(scores + i);
 
483
<a name="l00382"></a>00382     <span class="keywordflow">if</span> (!choice_it.empty()) {
 
484
<a name="l00383"></a>00383       <span class="comment">// The certainty score ranges between [-20,0]. This is converted here to</span>
 
485
<a name="l00384"></a>00384       <span class="comment">// [0,1], with 1 indicating best match.</span>
 
486
<a name="l00385"></a>00385       blob_o_score[i] = 1 + 0.05 * choice_it.data()-&gt;certainty();
 
487
<a name="l00386"></a>00386       total_blob_o_score += blob_o_score[i];
 
488
<a name="l00387"></a>00387     }
 
489
<a name="l00388"></a>00388   }
 
490
<a name="l00389"></a>00389   <span class="comment">// Normalize the orientation scores for the blob and use them to</span>
 
491
<a name="l00390"></a>00390   <span class="comment">// update the aggregated orientation score.</span>
 
492
<a name="l00391"></a>00391   <span class="keywordflow">for</span> (<span class="keywordtype">int</span> i = 0; total_blob_o_score != 0 &amp;&amp; i &lt; 4; ++i) {
 
493
<a name="l00392"></a>00392     osr_-&gt;<a class="code" href="a00478.html#a5fe9fa97000f89cd6f4392b55638e882">orientations</a>[i] += log(blob_o_score[i] / total_blob_o_score);
 
494
<a name="l00393"></a>00393   }
 
495
<a name="l00394"></a>00394 
 
496
<a name="l00395"></a>00395   <span class="keywordtype">float</span> first = -1;
 
497
<a name="l00396"></a>00396   <span class="keywordtype">float</span> second = -1;
 
498
<a name="l00397"></a>00397 
 
499
<a name="l00398"></a>00398   <span class="keywordflow">for</span> (<span class="keywordtype">int</span> i = 0; i &lt; 4; ++i) {
 
500
<a name="l00399"></a>00399     <span class="keywordflow">if</span> (osr_-&gt;<a class="code" href="a00478.html#a5fe9fa97000f89cd6f4392b55638e882">orientations</a>[i] &gt; first) {
 
501
<a name="l00400"></a>00400       second = first;
 
502
<a name="l00401"></a>00401       first = osr_-&gt;<a class="code" href="a00478.html#a5fe9fa97000f89cd6f4392b55638e882">orientations</a>[i];
 
503
<a name="l00402"></a>00402     } <span class="keywordflow">else</span> <span class="keywordflow">if</span> (osr_-&gt;<a class="code" href="a00478.html#a5fe9fa97000f89cd6f4392b55638e882">orientations</a>[i] &gt; second) {
 
504
<a name="l00403"></a>00403       second = osr_-&gt;<a class="code" href="a00478.html#a5fe9fa97000f89cd6f4392b55638e882">orientations</a>[i];
 
505
<a name="l00404"></a>00404     }
 
506
<a name="l00405"></a>00405   }
 
507
<a name="l00406"></a>00406 
 
508
<a name="l00407"></a>00407   <span class="keywordflow">return</span> first / second &gt; <a class="code" href="a00687.html#ad58ecd1e0aa2241ba3ccd5d0398c1e5c">kOrientationAcceptRatio</a>;
 
509
<a name="l00408"></a>00408 }
 
510
<a name="l00409"></a>00409 
 
511
<a name="l00410"></a><a class="code" href="a00476.html#a382b5269675f9db848485be62f35742e">00410</a> <span class="keywordtype">int</span> <a class="code" href="a00476.html#a382b5269675f9db848485be62f35742e">OrientationDetector::get_orientation</a>() {
 
512
<a name="l00411"></a>00411   osr_-&gt;<a class="code" href="a00478.html#af7b5cea89a2bdace52ad5825d6d5d4e6">update_best_orientation</a>();
 
513
<a name="l00412"></a>00412   <span class="keywordflow">return</span> osr_-&gt;<a class="code" href="a00478.html#a25f64011ea65c038c1ef1a6cedd10f1c">best_result</a>.<a class="code" href="a00477.html#a6dfb6826b41a81524ce867b005ba5641">orientation_id</a>;
 
514
<a name="l00413"></a>00413 }
 
515
<a name="l00414"></a>00414 
 
516
<a name="l00415"></a>00415 
 
517
<a name="l00416"></a><a class="code" href="a00530.html#ac44d1acf5214aecb8437e160e30db1d4">00416</a> <a class="code" href="a00530.html#ac44d1acf5214aecb8437e160e30db1d4">ScriptDetector::ScriptDetector</a>(<a class="code" href="a00478.html">OSResults</a>* osr, <a class="code" href="a00607.html">tesseract::Tesseract</a>* tess) {
 
518
<a name="l00417"></a>00417   osr_ = osr;
 
519
<a name="l00418"></a>00418   tess_ = tess;
 
520
<a name="l00419"></a>00419   katakana_id_ = tess_-&gt;<a class="code" href="a00295.html#a69c5179ac5f10a24f3f97e16ca09460f">unicharset</a>.<a class="code" href="a00642.html#a7cbfd800fe71082f0e7d58b7c25330bb">add_script</a>(katakana_script);
 
521
<a name="l00420"></a>00420   hiragana_id_ = tess_-&gt;<a class="code" href="a00295.html#a69c5179ac5f10a24f3f97e16ca09460f">unicharset</a>.<a class="code" href="a00642.html#a7cbfd800fe71082f0e7d58b7c25330bb">add_script</a>(hiragana_script);
 
522
<a name="l00421"></a>00421   han_id_ = tess_-&gt;<a class="code" href="a00295.html#a69c5179ac5f10a24f3f97e16ca09460f">unicharset</a>.<a class="code" href="a00642.html#a7cbfd800fe71082f0e7d58b7c25330bb">add_script</a>(han_script);
 
523
<a name="l00422"></a>00422   hangul_id_ = tess_-&gt;<a class="code" href="a00295.html#a69c5179ac5f10a24f3f97e16ca09460f">unicharset</a>.<a class="code" href="a00642.html#a7cbfd800fe71082f0e7d58b7c25330bb">add_script</a>(hangul_script);
 
524
<a name="l00423"></a>00423   japanese_id_ = tess_-&gt;<a class="code" href="a00295.html#a69c5179ac5f10a24f3f97e16ca09460f">unicharset</a>.<a class="code" href="a00642.html#a7cbfd800fe71082f0e7d58b7c25330bb">add_script</a>(japanese_script_);
 
525
<a name="l00424"></a>00424   korean_id_ = tess_-&gt;<a class="code" href="a00295.html#a69c5179ac5f10a24f3f97e16ca09460f">unicharset</a>.<a class="code" href="a00642.html#a7cbfd800fe71082f0e7d58b7c25330bb">add_script</a>(korean_script_);
 
526
<a name="l00425"></a>00425   latin_id_ = tess_-&gt;<a class="code" href="a00295.html#a69c5179ac5f10a24f3f97e16ca09460f">unicharset</a>.<a class="code" href="a00642.html#a7cbfd800fe71082f0e7d58b7c25330bb">add_script</a>(latin_script);
 
527
<a name="l00426"></a>00426   fraktur_id_ = tess_-&gt;<a class="code" href="a00295.html#a69c5179ac5f10a24f3f97e16ca09460f">unicharset</a>.<a class="code" href="a00642.html#a7cbfd800fe71082f0e7d58b7c25330bb">add_script</a>(fraktur_script_);
 
528
<a name="l00427"></a>00427 }
 
529
<a name="l00428"></a>00428 
 
530
<a name="l00429"></a>00429 
 
531
<a name="l00430"></a>00430 <span class="comment">// Score the given blob. Returns nothing: must_stop() makes the stop decision after</span>
 
532
<a name="l00431"></a>00431 <span class="comment">// adding this blob.</span>
 
533
<a name="l00432"></a><a class="code" href="a00530.html#aa1626a91138960515d479a781a6b97ca">00432</a> <span class="keywordtype">void</span> <a class="code" href="a00530.html#aa1626a91138960515d479a781a6b97ca">ScriptDetector::detect_blob</a>(BLOB_CHOICE_LIST* scores) {
 
534
<a name="l00433"></a>00433   <span class="keywordtype">bool</span> done[<a class="code" href="a00688.html#ab52d878a730b63bcf57d7bb3113882a1">kMaxNumberOfScripts</a>];
 
535
<a name="l00434"></a>00434   <span class="keywordflow">for</span> (<span class="keywordtype">int</span> i = 0; i &lt; 4; ++i) {
 
536
<a name="l00435"></a>00435     <span class="keywordflow">for</span> (<span class="keywordtype">int</span> j = 0; j &lt; <a class="code" href="a00688.html#ab52d878a730b63bcf57d7bb3113882a1">kMaxNumberOfScripts</a>; ++j)
 
537
<a name="l00436"></a>00436       done[j] = <span class="keyword">false</span>;
 
538
<a name="l00437"></a>00437 
 
539
<a name="l00438"></a>00438     BLOB_CHOICE_IT choice_it;
 
540
<a name="l00439"></a>00439     choice_it.set_to_list(scores + i);
 
541
<a name="l00440"></a>00440 
 
542
<a name="l00441"></a>00441     <span class="keywordtype">float</span> prev_score = -1;
 
543
<a name="l00442"></a>00442     <span class="keywordtype">int</span> script_count = 0;
 
544
<a name="l00443"></a>00443     <span class="keywordtype">int</span> prev_id = -1;
 
545
<a name="l00444"></a>00444     <span class="keywordtype">int</span> prev_fontinfo_id = -1;
 
546
<a name="l00445"></a>00445     <span class="keyword">const</span> <span class="keywordtype">char</span>* prev_unichar = <span class="stringliteral">&quot;&quot;</span>;
 
547
<a name="l00446"></a>00446     <span class="keyword">const</span> <span class="keywordtype">char</span>* unichar = <span class="stringliteral">&quot;&quot;</span>;
 
548
<a name="l00447"></a>00447 
 
549
<a name="l00448"></a>00448     <span class="keywordflow">for</span> (choice_it.mark_cycle_pt(); !choice_it.cycled_list();
 
550
<a name="l00449"></a>00449          choice_it.forward()) {
 
551
<a name="l00450"></a>00450       <a class="code" href="a00276.html">BLOB_CHOICE</a>* choice = choice_it.data();
 
552
<a name="l00451"></a>00451       <span class="keywordtype">int</span> <span class="keywordtype">id</span> = choice-&gt;<a class="code" href="a00276.html#a746d149d149ec75e4bea96f338b48433">script_id</a>();
 
553
<a name="l00452"></a>00452       <span class="comment">// Script already processed before.</span>
 
554
<a name="l00453"></a>00453       <span class="keywordflow">if</span> (done[<span class="keywordtype">id</span>]) <span class="keywordflow">continue</span>;
 
555
<a name="l00454"></a>00454       done[id] = <span class="keyword">true</span>;
 
556
<a name="l00455"></a>00455 
 
557
<a name="l00456"></a>00456       unichar = tess_-&gt;<a class="code" href="a00295.html#a69c5179ac5f10a24f3f97e16ca09460f">unicharset</a>.<a class="code" href="a00642.html#a421c0b6ebcbbe7547490252fb688c961">id_to_unichar</a>(choice-&gt;<a class="code" href="a00276.html#aaba6190b77c5f3dc21905fc4118afa94">unichar_id</a>());
 
558
<a name="l00457"></a>00457       <span class="comment">// Save data from the first match</span>
 
559
<a name="l00458"></a>00458       <span class="keywordflow">if</span> (prev_score &lt; 0) {
 
560
<a name="l00459"></a>00459         prev_score = -choice-&gt;<a class="code" href="a00276.html#af53d45b718c562ea7209b583c77ac14e">certainty</a>();
 
561
<a name="l00460"></a>00460         script_count = 1;
 
562
<a name="l00461"></a>00461         prev_id = id;
 
563
<a name="l00462"></a>00462         prev_unichar = unichar;
 
564
<a name="l00463"></a>00463         prev_fontinfo_id = choice-&gt;<a class="code" href="a00276.html#a3594e34861be86d775724f5f91fba3be">fontinfo_id</a>();
 
565
<a name="l00464"></a>00464       } <span class="keywordflow">else</span> <span class="keywordflow">if</span> (-choice-&gt;<a class="code" href="a00276.html#af53d45b718c562ea7209b583c77ac14e">certainty</a>() &lt; prev_score + <a class="code" href="a00687.html#a14c7913eafbd3237afbdd7c6b498b2d8">kNonAmbiguousMargin</a>) {
 
566
<a name="l00465"></a>00465         ++script_count;
 
567
<a name="l00466"></a>00466       }
 
568
<a name="l00467"></a>00467 
 
569
<a name="l00468"></a>00468       <span class="keywordflow">if</span> (strlen(prev_unichar) == 1)
 
570
<a name="l00469"></a>00469         <span class="keywordflow">if</span> (unichar[0] &gt;= <span class="charliteral">&#39;0&#39;</span> &amp;&amp; unichar[0] &lt;= <span class="charliteral">&#39;9&#39;</span>)
 
571
<a name="l00470"></a>00470           <span class="keywordflow">break</span>;
 
572
<a name="l00471"></a>00471 
 
573
<a name="l00472"></a>00472       <span class="comment">// if script_count is &gt;= 2, character is ambiguous, skip other matches</span>
 
574
<a name="l00473"></a>00473       <span class="comment">// since they are useless.</span>
 
575
<a name="l00474"></a>00474       <span class="keywordflow">if</span> (script_count &gt;= 2)
 
576
<a name="l00475"></a>00475         <span class="keywordflow">break</span>;
 
577
<a name="l00476"></a>00476     }
 
578
<a name="l00477"></a>00477     <span class="comment">// Character is non ambiguous</span>
 
579
<a name="l00478"></a>00478     <span class="keywordflow">if</span> (script_count == 1) {
 
580
<a name="l00479"></a>00479       <span class="comment">// Update the score of the winning script</span>
 
581
<a name="l00480"></a>00480       osr_-&gt;<a class="code" href="a00478.html#af612cc25d8432678d5b87a5911544792">scripts_na</a>[i][prev_id] += 1.0;
 
582
<a name="l00481"></a>00481 
 
583
<a name="l00482"></a>00482       <span class="comment">// Workaround for Fraktur</span>
 
584
<a name="l00483"></a>00483       <span class="keywordflow">if</span> (prev_id == latin_id_) {
 
585
<a name="l00484"></a>00484         <span class="keywordflow">if</span> (prev_fontinfo_id &gt;= 0) {
 
586
<a name="l00485"></a>00485           <span class="keyword">const</span> <a class="code" href="a00389.html">tesseract::FontInfo</a> &amp;fi =
 
587
<a name="l00486"></a>00486               tess_-&gt;<a class="code" href="a00314.html#a62597f182a5e23c3b8a030c06e699e99">get_fontinfo_table</a>().<a class="code" href="a00643.html#a3b3107bc72d9edfe501eaba7404de7eb" title="Return the object from an id.">get</a>(prev_fontinfo_id);
 
588
<a name="l00487"></a>00487           <span class="comment">//printf(&quot;Font: %s i:%i b:%i f:%i s:%i k:%i (%s)\n&quot;, fi.name,</span>
 
589
<a name="l00488"></a>00488           <span class="comment">//       fi.is_italic(), fi.is_bold(), fi.is_fixed_pitch(),</span>
 
590
<a name="l00489"></a>00489           <span class="comment">//       fi.is_serif(), fi.is_fraktur(),</span>
 
591
<a name="l00490"></a>00490           <span class="comment">//       prev_unichar);</span>
 
592
<a name="l00491"></a>00491           <span class="keywordflow">if</span> (fi.<a class="code" href="a00389.html#a5a918bad85fde70770f60853355c1716">is_fraktur</a>()) {
 
593
<a name="l00492"></a>00492             osr_-&gt;<a class="code" href="a00478.html#af612cc25d8432678d5b87a5911544792">scripts_na</a>[i][prev_id] -= 1.0;
 
594
<a name="l00493"></a>00493             osr_-&gt;<a class="code" href="a00478.html#af612cc25d8432678d5b87a5911544792">scripts_na</a>[i][fraktur_id_] += 1.0;
 
595
<a name="l00494"></a>00494           }
 
596
<a name="l00495"></a>00495         }
 
597
<a name="l00496"></a>00496       }
 
598
<a name="l00497"></a>00497 
 
599
<a name="l00498"></a>00498       <span class="comment">// Update Japanese / Korean pseudo-scripts</span>
 
600
<a name="l00499"></a>00499       <span class="keywordflow">if</span> (prev_id == katakana_id_)
 
601
<a name="l00500"></a>00500         osr_-&gt;<a class="code" href="a00478.html#af612cc25d8432678d5b87a5911544792">scripts_na</a>[i][japanese_id_] += 1.0;
 
602
<a name="l00501"></a>00501       <span class="keywordflow">if</span> (prev_id == hiragana_id_)
 
603
<a name="l00502"></a>00502         osr_-&gt;<a class="code" href="a00478.html#af612cc25d8432678d5b87a5911544792">scripts_na</a>[i][japanese_id_] += 1.0;
 
604
<a name="l00503"></a>00503       <span class="keywordflow">if</span> (prev_id == hangul_id_)
 
605
<a name="l00504"></a>00504         osr_-&gt;<a class="code" href="a00478.html#af612cc25d8432678d5b87a5911544792">scripts_na</a>[i][korean_id_] += 1.0;
 
606
<a name="l00505"></a>00505       <span class="keywordflow">if</span> (prev_id == han_id_)
 
607
<a name="l00506"></a>00506         osr_-&gt;<a class="code" href="a00478.html#af612cc25d8432678d5b87a5911544792">scripts_na</a>[i][korean_id_] += <a class="code" href="a00687.html#ae3f12edb58f6ed0a11daea2cbf8dc547">kHanRatioInKorean</a>;
 
608
<a name="l00507"></a>00507       <span class="keywordflow">if</span> (prev_id == han_id_)
 
609
<a name="l00508"></a>00508         osr_-&gt;<a class="code" href="a00478.html#af612cc25d8432678d5b87a5911544792">scripts_na</a>[i][japanese_id_] += <a class="code" href="a00687.html#aab3b7e76eea520b1e4b9d68165e3a094">kHanRatioInJapanese</a>;
 
610
<a name="l00509"></a>00509     }
 
611
<a name="l00510"></a>00510   }  <span class="comment">// iterate over each orientation</span>
 
612
<a name="l00511"></a>00511 }
 
613
<a name="l00512"></a>00512 
 
614
<a name="l00513"></a><a class="code" href="a00530.html#a951bd4d3f5b14ee234d20afc91d44585">00513</a> <span class="keywordtype">bool</span> <a class="code" href="a00530.html#a951bd4d3f5b14ee234d20afc91d44585">ScriptDetector::must_stop</a>(<span class="keywordtype">int</span> orientation) {
 
615
<a name="l00514"></a>00514   osr_-&gt;<a class="code" href="a00478.html#ab796da60cc16d39f464c03fe4047c358">update_best_script</a>(orientation);
 
616
<a name="l00515"></a>00515   <span class="keywordflow">return</span> osr_-&gt;<a class="code" href="a00478.html#a25f64011ea65c038c1ef1a6cedd10f1c">best_result</a>.<a class="code" href="a00477.html#ae39a2c718b010ed27eb7f820546da6d6">sconfidence</a> &gt; 1;
 
617
<a name="l00516"></a>00516 }
 
618
<a name="l00517"></a>00517 
 
619
<a name="l00518"></a>00518 <span class="comment">// Helper method to convert an orientation index to its value in degrees.</span>
 
620
<a name="l00519"></a>00519 <span class="comment">// The value represents the amount of clockwise rotation in degrees that must be</span>
 
621
<a name="l00520"></a>00520 <span class="comment">// applied for the text to be upright (readable).</span>
 
622
<a name="l00521"></a><a class="code" href="a00688.html#a4239adc5aad0a7487a6d414f91fc41b2">00521</a> <span class="keyword">const</span> <span class="keywordtype">int</span> <a class="code" href="a00687.html#a94d19668c76dab0d8ab3832c765303da">OrientationIdToValue</a>(<span class="keyword">const</span> <span class="keywordtype">int</span>&amp; <span class="keywordtype">id</span>) {
 
623
<a name="l00522"></a>00522   <span class="keywordflow">switch</span> (<span class="keywordtype">id</span>) {
 
624
<a name="l00523"></a>00523     <span class="keywordflow">case</span> 0:
 
625
<a name="l00524"></a>00524       <span class="keywordflow">return</span> 0;
 
626
<a name="l00525"></a>00525     <span class="keywordflow">case</span> 1:
 
627
<a name="l00526"></a>00526       <span class="keywordflow">return</span> 270;
 
628
<a name="l00527"></a>00527     <span class="keywordflow">case</span> 2:
 
629
<a name="l00528"></a>00528       <span class="keywordflow">return</span> 180;
 
630
<a name="l00529"></a>00529     <span class="keywordflow">case</span> 3:
 
631
<a name="l00530"></a>00530       <span class="keywordflow">return</span> 90;
 
632
<a name="l00531"></a>00531     <span class="keywordflow">default</span>:
 
633
<a name="l00532"></a>00532       <span class="keywordflow">return</span> -1;
 
634
<a name="l00533"></a>00533   }
 
635
<a name="l00534"></a>00534 }
 
636
</pre></div></div><!-- contents -->
 
637
</div>
 
638
<!-- window showing the filter options -->
 
639
<div id="MSearchSelectWindow"
 
640
     onmouseover="return searchBox.OnSearchSelectShow()"
 
641
     onmouseout="return searchBox.OnSearchSelectHide()"
 
642
     onkeydown="return searchBox.OnSearchSelectKey(event)">
 
643
<a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(0)"><span class="SelectionMark">&#160;</span>All</a><a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(1)"><span class="SelectionMark">&#160;</span>Classes</a><a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(2)"><span class="SelectionMark">&#160;</span>Namespaces</a><a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(3)"><span class="SelectionMark">&#160;</span>Files</a><a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(4)"><span class="SelectionMark">&#160;</span>Functions</a><a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(5)"><span class="SelectionMark">&#160;</span>Variables</a><a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(6)"><span class="SelectionMark">&#160;</span>Typedefs</a><a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(7)"><span class="SelectionMark">&#160;</span>Enumerations</a><a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(8)"><span class="SelectionMark">&#160;</span>Enumerator</a><a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(9)"><span class="SelectionMark">&#160;</span>Friends</a><a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(10)"><span class="SelectionMark">&#160;</span>Defines</a></div>
 
644
 
 
645
<!-- iframe showing the search results (closed by default) -->
 
646
<div id="MSearchResultsWindow">
 
647
<iframe src="javascript:void(0)" frameborder="0" 
 
648
        name="MSearchResults" id="MSearchResults" title="Search results">
 
649
</iframe>
 
650
</div>
 
651
 
 
652
  <div id="nav-path" class="navpath">
 
653
    <ul>
 
654
      <li class="navelem"><a class="el" href="a00687.html">osdetect.cpp</a>      </li>
 
655
 
 
656
    <li class="footer">Generated on Mon Feb 3 2014 10:59:07 for tesseract by
 
657
    <a href="http://www.doxygen.org/index.html">
 
658
    <img class="footer" src="doxygen.png" alt="doxygen"/></a> 1.7.6.1 </li>
 
659
   </ul>
 
660
 </div>
 
661
 
 
662
 
 
663
</body>
 
664
</html>