1
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
2
<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
4
<meta http-equiv="Content-Type" content="text/html;charset=UTF-8"/>
5
<meta http-equiv="X-UA-Compatible" content="IE=9"/>
6
<title>tesseract: /usr/local/google/home/jbreiden/tesseract-ocr-read-only/ccmain/osdetect.cpp Source File</title>
8
<link href="tabs.css" rel="stylesheet" type="text/css"/>
9
<link href="doxygen.css" rel="stylesheet" type="text/css" />
10
<link href="navtree.css" rel="stylesheet" type="text/css"/>
11
<script type="text/javascript" src="jquery.js"></script>
12
<script type="text/javascript" src="resize.js"></script>
13
<script type="text/javascript" src="navtree.js"></script>
14
<script type="text/javascript">
15
$(document).ready(initResizable);
17
<link href="search/search.css" rel="stylesheet" type="text/css"/>
18
<script type="text/javascript" src="search/search.js"></script>
19
<script type="text/javascript">
20
$(document).ready(function() { searchBox.OnSelectItem(0); });
25
<div id="top"><!-- do not remove this div! -->
29
<table cellspacing="0" cellpadding="0">
31
<tr style="height: 56px;">
34
<td style="padding-left: 0.5em;">
35
<div id="projectname">tesseract
36
 <span id="projectnumber">3.03</span>
48
<!-- Generated by Doxygen 1.7.6.1 -->
49
<script type="text/javascript">
50
var searchBox = new SearchBox("searchBox", "search",false,'Search');
52
<div id="navrow1" class="tabs">
54
<li><a href="index.html"><span>Main Page</span></a></li>
55
<li><a href="pages.html"><span>Related Pages</span></a></li>
56
<li><a href="modules.html"><span>Modules</span></a></li>
57
<li><a href="namespaces.html"><span>Namespaces</span></a></li>
58
<li><a href="annotated.html"><span>Classes</span></a></li>
59
<li class="current"><a href="files.html"><span>Files</span></a></li>
61
<div id="MSearchBox" class="MSearchBoxInactive">
63
<img id="MSearchSelect" src="search/mag_sel.png"
64
onmouseover="return searchBox.OnSearchSelectShow()"
65
onmouseout="return searchBox.OnSearchSelectHide()"
67
<input type="text" id="MSearchField" value="Search" accesskey="S"
68
onfocus="searchBox.OnSearchFieldFocus(true)"
69
onblur="searchBox.OnSearchFieldFocus(false)"
70
onkeyup="searchBox.OnSearchFieldChange(event)"/>
71
</span><span class="right">
72
<a id="MSearchClose" href="javascript:searchBox.CloseResultsWindow()"><img id="MSearchCloseImg" border="0" src="search/close.png" alt=""/></a>
78
<div id="navrow2" class="tabs2">
80
<li><a href="files.html"><span>File List</span></a></li>
81
<li><a href="globals.html"><span>File Members</span></a></li>
85
<div id="side-nav" class="ui-resizable side-nav-resizable">
87
<div id="nav-tree-contents">
90
<div id="splitbar" style="-moz-user-select:none;"
91
class="ui-resizable-handle">
94
<script type="text/javascript">
95
initNavTree('a00687.html','');
97
<div id="doc-content">
99
<div class="headertitle">
100
<div class="title">/usr/local/google/home/jbreiden/tesseract-ocr-read-only/ccmain/osdetect.cpp</div> </div>
102
<div class="contents">
103
<a href="a00687.html">Go to the documentation of this file.</a><div class="fragment"><pre class="fragment"><a name="l00001"></a>00001
104
<a name="l00002"></a>00002 <span class="comment">// File: osdetect.cpp</span>
105
<a name="l00003"></a>00003 <span class="comment">// Description: Orientation and script detection.</span>
106
<a name="l00004"></a>00004 <span class="comment">// Author: Samuel Charron</span>
107
<a name="l00005"></a>00005 <span class="comment">// Ranjith Unnikrishnan</span>
108
<a name="l00006"></a>00006 <span class="comment">//</span>
109
<a name="l00007"></a>00007 <span class="comment">// (C) Copyright 2008, Google Inc.</span>
110
<a name="l00008"></a>00008 <span class="comment">// Licensed under the Apache License, Version 2.0 (the "License");</span>
111
<a name="l00009"></a>00009 <span class="comment">// you may not use this file except in compliance with the License.</span>
112
<a name="l00010"></a>00010 <span class="comment">// You may obtain a copy of the License at</span>
113
<a name="l00011"></a>00011 <span class="comment">// http://www.apache.org/licenses/LICENSE-2.0</span>
114
<a name="l00012"></a>00012 <span class="comment">// Unless required by applicable law or agreed to in writing, software</span>
115
<a name="l00013"></a>00013 <span class="comment">// distributed under the License is distributed on an "AS IS" BASIS,</span>
116
<a name="l00014"></a>00014 <span class="comment">// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.</span>
117
<a name="l00015"></a>00015 <span class="comment">// See the License for the specific language governing permissions and</span>
118
<a name="l00016"></a>00016 <span class="comment">// limitations under the License.</span>
119
<a name="l00017"></a>00017 <span class="comment">//</span>
120
<a name="l00019"></a>00019 <span class="comment"></span>
121
<a name="l00020"></a>00020 <span class="preprocessor">#include "<a class="code" href="a00688.html">osdetect.h</a>"</span>
122
<a name="l00021"></a>00021
123
<a name="l00022"></a>00022 <span class="preprocessor">#include "<a class="code" href="a00728.html">blobbox.h</a>"</span>
124
<a name="l00023"></a>00023 <span class="preprocessor">#include "<a class="code" href="a00732.html">blread.h</a>"</span>
125
<a name="l00024"></a>00024 <span class="preprocessor">#include "<a class="code" href="a01099.html">colfind.h</a>"</span>
126
<a name="l00025"></a>00025 <span class="preprocessor">#include "<a class="code" href="a00747.html">fontinfo.h</a>"</span>
127
<a name="l00026"></a>00026 <span class="preprocessor">#include "<a class="code" href="a01123.html">imagefind.h</a>"</span>
128
<a name="l00027"></a>00027 <span class="preprocessor">#include "<a class="code" href="a01125.html">linefind.h</a>"</span>
129
<a name="l00028"></a>00028 <span class="preprocessor">#include "<a class="code" href="a01043.html">oldlist.h</a>"</span>
130
<a name="l00029"></a>00029 <span class="preprocessor">#include "<a class="code" href="a00846.html">qrsequence.h</a>"</span>
131
<a name="l00030"></a>00030 <span class="preprocessor">#include "<a class="code" href="a00788.html">ratngs.h</a>"</span>
132
<a name="l00031"></a>00031 <span class="preprocessor">#include "<a class="code" href="a00855.html">strngs.h</a>"</span>
133
<a name="l00032"></a>00032 <span class="preprocessor">#include "<a class="code" href="a01147.html">tabvector.h</a>"</span>
134
<a name="l00033"></a>00033 <span class="preprocessor">#include "<a class="code" href="a00716.html">tesseractclass.h</a>"</span>
135
<a name="l00034"></a>00034 <span class="preprocessor">#include "<a class="code" href="a01151.html">textord.h</a>"</span>
136
<a name="l00035"></a>00035
137
<a name="l00036"></a><a class="code" href="a00687.html#a1dcbb4454cb6c97be113fc6ae820c958">00036</a> <span class="keyword">const</span> <span class="keywordtype">int</span> <a class="code" href="a00687.html#a1dcbb4454cb6c97be113fc6ae820c958">kMinCharactersToTry</a> = 50;
138
<a name="l00037"></a><a class="code" href="a00687.html#ab1eb3d41a8092b2cc34e2c1d17886521">00037</a> <span class="keyword">const</span> <span class="keywordtype">int</span> <a class="code" href="a00687.html#ab1eb3d41a8092b2cc34e2c1d17886521">kMaxCharactersToTry</a> = 5 * <a class="code" href="a00687.html#a1dcbb4454cb6c97be113fc6ae820c958">kMinCharactersToTry</a>;
139
<a name="l00038"></a>00038
140
<a name="l00039"></a><a class="code" href="a00687.html#ac23eec99b25d1c109fb6ee2590a331bf">00039</a> <span class="keyword">const</span> <span class="keywordtype">float</span> <a class="code" href="a00687.html#ac23eec99b25d1c109fb6ee2590a331bf">kSizeRatioToReject</a> = 2.0;
141
<a name="l00040"></a><a class="code" href="a00687.html#aaba53b59683a4788881c7b8281f25fac">00040</a> <span class="keyword">const</span> <span class="keywordtype">int</span> <a class="code" href="a00687.html#aaba53b59683a4788881c7b8281f25fac">kMinAcceptableBlobHeight</a> = 10;
142
<a name="l00041"></a>00041
143
<a name="l00042"></a><a class="code" href="a00687.html#ad58ecd1e0aa2241ba3ccd5d0398c1e5c">00042</a> <span class="keyword">const</span> <span class="keywordtype">float</span> <a class="code" href="a00687.html#ad58ecd1e0aa2241ba3ccd5d0398c1e5c">kOrientationAcceptRatio</a> = 1.3;
144
<a name="l00043"></a><a class="code" href="a00687.html#a448b61b7951bc14ffab3cc00ba37aadd">00043</a> <span class="keyword">const</span> <span class="keywordtype">float</span> <a class="code" href="a00687.html#a448b61b7951bc14ffab3cc00ba37aadd">kScriptAcceptRatio</a> = 1.3;
145
<a name="l00044"></a>00044
146
<a name="l00045"></a><a class="code" href="a00687.html#ae3f12edb58f6ed0a11daea2cbf8dc547">00045</a> <span class="keyword">const</span> <span class="keywordtype">float</span> <a class="code" href="a00687.html#ae3f12edb58f6ed0a11daea2cbf8dc547">kHanRatioInKorean</a> = 0.7;
147
<a name="l00046"></a><a class="code" href="a00687.html#aab3b7e76eea520b1e4b9d68165e3a094">00046</a> <span class="keyword">const</span> <span class="keywordtype">float</span> <a class="code" href="a00687.html#aab3b7e76eea520b1e4b9d68165e3a094">kHanRatioInJapanese</a> = 0.3;
148
<a name="l00047"></a>00047
149
<a name="l00048"></a><a class="code" href="a00687.html#a14c7913eafbd3237afbdd7c6b498b2d8">00048</a> <span class="keyword">const</span> <span class="keywordtype">float</span> <a class="code" href="a00687.html#a14c7913eafbd3237afbdd7c6b498b2d8">kNonAmbiguousMargin</a> = 1.0;
150
<a name="l00049"></a>00049
151
<a name="l00050"></a>00050 <span class="comment">// General scripts</span>
152
<a name="l00051"></a>00051 <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">char</span>* han_script = <span class="stringliteral">"Han"</span>;
153
<a name="l00052"></a>00052 <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">char</span>* latin_script = <span class="stringliteral">"Latin"</span>;
154
<a name="l00053"></a>00053 <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">char</span>* katakana_script = <span class="stringliteral">"Katakana"</span>;
155
<a name="l00054"></a>00054 <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">char</span>* hiragana_script = <span class="stringliteral">"Hiragana"</span>;
156
<a name="l00055"></a>00055 <span class="keyword">static</span> <span class="keyword">const</span> <span class="keywordtype">char</span>* hangul_script = <span class="stringliteral">"Hangul"</span>;
157
<a name="l00056"></a>00056
158
<a name="l00057"></a>00057 <span class="comment">// Pseudo-scripts Name</span>
159
<a name="l00058"></a>00058 <span class="keyword">const</span> <span class="keywordtype">char</span>* ScriptDetector::korean_script_ = <span class="stringliteral">"Korean"</span>;
160
<a name="l00059"></a>00059 <span class="keyword">const</span> <span class="keywordtype">char</span>* ScriptDetector::japanese_script_ = <span class="stringliteral">"Japanese"</span>;
161
<a name="l00060"></a>00060 <span class="keyword">const</span> <span class="keywordtype">char</span>* ScriptDetector::fraktur_script_ = <span class="stringliteral">"Fraktur"</span>;
162
<a name="l00061"></a>00061
163
<a name="l00062"></a>00062 <span class="comment">// Minimum believable resolution.</span>
164
<a name="l00063"></a><a class="code" href="a00687.html#af9f4de4278c712c02788092501b587f3">00063</a> <span class="keyword">const</span> <span class="keywordtype">int</span> <a class="code" href="a00687.html#af9f4de4278c712c02788092501b587f3">kMinCredibleResolution</a> = 70;
165
<a name="l00064"></a>00064 <span class="comment">// Default resolution used if input is not believable.</span>
166
<a name="l00065"></a><a class="code" href="a00687.html#ad3674a322dd444a002052c5b929b1976">00065</a> <span class="keyword">const</span> <span class="keywordtype">int</span> <a class="code" href="a00687.html#ad3674a322dd444a002052c5b929b1976">kDefaultResolution</a> = 300;
167
<a name="l00066"></a>00066
168
<a name="l00067"></a><a class="code" href="a00478.html#af7b5cea89a2bdace52ad5825d6d5d4e6">00067</a> <span class="keywordtype">void</span> <a class="code" href="a00478.html#af7b5cea89a2bdace52ad5825d6d5d4e6">OSResults::update_best_orientation</a>() {
169
<a name="l00068"></a>00068 <span class="keywordtype">float</span> first = <a class="code" href="a00478.html#a5fe9fa97000f89cd6f4392b55638e882">orientations</a>[0];
170
<a name="l00069"></a>00069 <span class="keywordtype">float</span> second = <a class="code" href="a00478.html#a5fe9fa97000f89cd6f4392b55638e882">orientations</a>[1];
171
<a name="l00070"></a>00070 <a class="code" href="a00478.html#a25f64011ea65c038c1ef1a6cedd10f1c">best_result</a>.<a class="code" href="a00477.html#a6dfb6826b41a81524ce867b005ba5641">orientation_id</a> = 0;
172
<a name="l00071"></a>00071 <span class="keywordflow">if</span> (<a class="code" href="a00478.html#a5fe9fa97000f89cd6f4392b55638e882">orientations</a>[0] &lt; <a class="code" href="a00478.html#a5fe9fa97000f89cd6f4392b55638e882">orientations</a>[1]) {
173
<a name="l00072"></a>00072 first = <a class="code" href="a00478.html#a5fe9fa97000f89cd6f4392b55638e882">orientations</a>[1];
174
<a name="l00073"></a>00073 second = <a class="code" href="a00478.html#a5fe9fa97000f89cd6f4392b55638e882">orientations</a>[0];
175
<a name="l00074"></a>00074 <a class="code" href="a00478.html#a25f64011ea65c038c1ef1a6cedd10f1c">best_result</a>.<a class="code" href="a00477.html#a6dfb6826b41a81524ce867b005ba5641">orientation_id</a> = 1;
176
<a name="l00075"></a>00075 }
177
<a name="l00076"></a>00076 <span class="keywordflow">for</span> (<span class="keywordtype">int</span> i = 2; i &lt; 4; ++i) {
178
<a name="l00077"></a>00077 <span class="keywordflow">if</span> (<a class="code" href="a00478.html#a5fe9fa97000f89cd6f4392b55638e882">orientations</a>[i] > first) {
179
<a name="l00078"></a>00078 second = first;
180
<a name="l00079"></a>00079 first = <a class="code" href="a00478.html#a5fe9fa97000f89cd6f4392b55638e882">orientations</a>[i];
181
<a name="l00080"></a>00080 <a class="code" href="a00478.html#a25f64011ea65c038c1ef1a6cedd10f1c">best_result</a>.<a class="code" href="a00477.html#a6dfb6826b41a81524ce867b005ba5641">orientation_id</a> = i;
182
<a name="l00081"></a>00081 } <span class="keywordflow">else</span> <span class="keywordflow">if</span> (<a class="code" href="a00478.html#a5fe9fa97000f89cd6f4392b55638e882">orientations</a>[i] > second) {
183
<a name="l00082"></a>00082 second = <a class="code" href="a00478.html#a5fe9fa97000f89cd6f4392b55638e882">orientations</a>[i];
184
<a name="l00083"></a>00083 }
185
<a name="l00084"></a>00084 }
186
<a name="l00085"></a>00085 <span class="comment">// Store difference of top two orientation scores.</span>
187
<a name="l00086"></a>00086 <a class="code" href="a00478.html#a25f64011ea65c038c1ef1a6cedd10f1c">best_result</a>.<a class="code" href="a00477.html#a67e009467e4db6c40777548ffdfe464e">oconfidence</a> = first - second;
188
<a name="l00087"></a>00087 }
189
<a name="l00088"></a>00088
190
<a name="l00089"></a><a class="code" href="a00478.html#aa13f0e8c136d10e0af341f163951ed3d">00089</a> <span class="keywordtype">void</span> <a class="code" href="a00478.html#aa13f0e8c136d10e0af341f163951ed3d">OSResults::set_best_orientation</a>(<span class="keywordtype">int</span> orientation_id) {
191
<a name="l00090"></a>00090 <a class="code" href="a00478.html#a25f64011ea65c038c1ef1a6cedd10f1c">best_result</a>.<a class="code" href="a00477.html#a6dfb6826b41a81524ce867b005ba5641">orientation_id</a> = orientation_id;
192
<a name="l00091"></a>00091 <a class="code" href="a00478.html#a25f64011ea65c038c1ef1a6cedd10f1c">best_result</a>.<a class="code" href="a00477.html#a67e009467e4db6c40777548ffdfe464e">oconfidence</a> = 0;
193
<a name="l00092"></a>00092 }
194
<a name="l00093"></a>00093
195
<a name="l00094"></a><a class="code" href="a00478.html#ab796da60cc16d39f464c03fe4047c358">00094</a> <span class="keywordtype">void</span> <a class="code" href="a00478.html#ab796da60cc16d39f464c03fe4047c358">OSResults::update_best_script</a>(<span class="keywordtype">int</span> orientation) {
196
<a name="l00095"></a>00095 <span class="comment">// We skip index 0 to ignore the "Common" script.</span>
197
<a name="l00096"></a>00096 <span class="keywordtype">float</span> first = <a class="code" href="a00478.html#af612cc25d8432678d5b87a5911544792">scripts_na</a>[orientation][1];
198
<a name="l00097"></a>00097 <span class="keywordtype">float</span> second = <a class="code" href="a00478.html#af612cc25d8432678d5b87a5911544792">scripts_na</a>[orientation][2];
199
<a name="l00098"></a>00098 <a class="code" href="a00478.html#a25f64011ea65c038c1ef1a6cedd10f1c">best_result</a>.<a class="code" href="a00477.html#a0647ea3dc4a399a472c48ab1eacd31e1">script_id</a> = 1;
200
<a name="l00099"></a>00099 <span class="keywordflow">if</span> (<a class="code" href="a00478.html#af612cc25d8432678d5b87a5911544792">scripts_na</a>[orientation][1] &lt; <a class="code" href="a00478.html#af612cc25d8432678d5b87a5911544792">scripts_na</a>[orientation][2]) {
201
<a name="l00100"></a>00100 first = <a class="code" href="a00478.html#af612cc25d8432678d5b87a5911544792">scripts_na</a>[orientation][2];
202
<a name="l00101"></a>00101 second = <a class="code" href="a00478.html#af612cc25d8432678d5b87a5911544792">scripts_na</a>[orientation][1];
203
<a name="l00102"></a>00102 <a class="code" href="a00478.html#a25f64011ea65c038c1ef1a6cedd10f1c">best_result</a>.<a class="code" href="a00477.html#a0647ea3dc4a399a472c48ab1eacd31e1">script_id</a> = 2;
204
<a name="l00103"></a>00103 }
205
<a name="l00104"></a>00104 <span class="keywordflow">for</span> (<span class="keywordtype">int</span> i = 3; i &lt; <a class="code" href="a00688.html#ab52d878a730b63bcf57d7bb3113882a1">kMaxNumberOfScripts</a>; ++i) {
206
<a name="l00105"></a>00105 <span class="keywordflow">if</span> (<a class="code" href="a00478.html#af612cc25d8432678d5b87a5911544792">scripts_na</a>[orientation][i] > first) {
207
<a name="l00106"></a>00106 <a class="code" href="a00478.html#a25f64011ea65c038c1ef1a6cedd10f1c">best_result</a>.<a class="code" href="a00477.html#a0647ea3dc4a399a472c48ab1eacd31e1">script_id</a> = i;
208
<a name="l00107"></a>00107 second = first;
209
<a name="l00108"></a>00108 first = <a class="code" href="a00478.html#af612cc25d8432678d5b87a5911544792">scripts_na</a>[orientation][i];
210
<a name="l00109"></a>00109 } <span class="keywordflow">else</span> <span class="keywordflow">if</span> (<a class="code" href="a00478.html#af612cc25d8432678d5b87a5911544792">scripts_na</a>[orientation][i] > second) {
211
<a name="l00110"></a>00110 second = <a class="code" href="a00478.html#af612cc25d8432678d5b87a5911544792">scripts_na</a>[orientation][i];
212
<a name="l00111"></a>00111 }
213
<a name="l00112"></a>00112 }
214
<a name="l00113"></a>00113 <a class="code" href="a00478.html#a25f64011ea65c038c1ef1a6cedd10f1c">best_result</a>.<a class="code" href="a00477.html#ae39a2c718b010ed27eb7f820546da6d6">sconfidence</a> =
215
<a name="l00114"></a>00114 (first / second - 1.0) / (<a class="code" href="a00687.html#a448b61b7951bc14ffab3cc00ba37aadd">kScriptAcceptRatio</a> - 1.0);
216
<a name="l00115"></a>00115 }
217
<a name="l00116"></a>00116
218
<a name="l00117"></a><a class="code" href="a00478.html#a9dcb5250ae2466116c33f5d220223296">00117</a> <span class="keywordtype">int</span> <a class="code" href="a00478.html#a9dcb5250ae2466116c33f5d220223296">OSResults::get_best_script</a>(<span class="keywordtype">int</span> orientation_id)<span class="keyword"> const </span>{
219
<a name="l00118"></a>00118 <span class="keywordtype">int</span> max_id = -1;
220
<a name="l00119"></a>00119 <span class="keywordflow">for</span> (<span class="keywordtype">int</span> j = 0; j &lt; <a class="code" href="a00688.html#ab52d878a730b63bcf57d7bb3113882a1">kMaxNumberOfScripts</a>; ++j) {
221
<a name="l00120"></a>00120 <span class="keyword">const</span> <span class="keywordtype">char</span> *script = <a class="code" href="a00478.html#a78ebdae52f3c685095b56790598ad97c">unicharset</a>-><a class="code" href="a00642.html#a4fc0f6815e2091efedcff7ab6183d19a">get_script_from_script_id</a>(j);
222
<a name="l00121"></a>00121 <span class="keywordflow">if</span> (strcmp(script, <span class="stringliteral">"Common"</span>) &amp;&amp; strcmp(script, <span class="stringliteral">"NULL"</span>)) {
223
<a name="l00122"></a>00122 <span class="keywordflow">if</span> (max_id == -1 ||
224
<a name="l00123"></a>00123 <a class="code" href="a00478.html#af612cc25d8432678d5b87a5911544792">scripts_na</a>[orientation_id][j] > <a class="code" href="a00478.html#af612cc25d8432678d5b87a5911544792">scripts_na</a>[orientation_id][max_id])
225
<a name="l00124"></a>00124 max_id = j;
226
<a name="l00125"></a>00125 }
227
<a name="l00126"></a>00126 }
228
<a name="l00127"></a>00127 <span class="keywordflow">return</span> max_id;
229
<a name="l00128"></a>00128 }
230
<a name="l00129"></a>00129
231
<a name="l00130"></a>00130 <span class="comment">// Print the script scores for all possible orientations.</span>
232
<a name="l00131"></a><a class="code" href="a00478.html#a4425aefc39fde345cea1288d95691bed">00131</a> <span class="keywordtype">void</span> <a class="code" href="a00478.html#a4425aefc39fde345cea1288d95691bed">OSResults::print_scores</a>(<span class="keywordtype">void</span>)<span class="keyword"> const </span>{
233
<a name="l00132"></a>00132 <span class="keywordflow">for</span> (<span class="keywordtype">int</span> i = 0; i &lt; 4; ++i) {
234
<a name="l00133"></a>00133 <a class="code" href="a00860.html#a02aa7cca2c3857c14716e8cca96ace6c">tprintf</a>(<span class="stringliteral">"Orientation id #%d"</span>, i);
235
<a name="l00134"></a>00134 <a class="code" href="a00478.html#a4425aefc39fde345cea1288d95691bed">print_scores</a>(i);
236
<a name="l00135"></a>00135 }
237
<a name="l00136"></a>00136 }
238
<a name="l00137"></a>00137
239
<a name="l00138"></a>00138 <span class="comment">// Print the script scores for the given candidate orientation.</span>
240
<a name="l00139"></a><a class="code" href="a00478.html#a4c4c5d0fce6889edeea358f755f7e378">00139</a> <span class="keywordtype">void</span> <a class="code" href="a00478.html#a4425aefc39fde345cea1288d95691bed">OSResults::print_scores</a>(<span class="keywordtype">int</span> orientation_id)<span class="keyword"> const </span>{
241
<a name="l00140"></a>00140 <span class="keywordflow">for</span> (<span class="keywordtype">int</span> j = 0; j &lt; <a class="code" href="a00688.html#ab52d878a730b63bcf57d7bb3113882a1">kMaxNumberOfScripts</a>; ++j) {
242
<a name="l00141"></a>00141 <span class="keywordflow">if</span> (<a class="code" href="a00478.html#af612cc25d8432678d5b87a5911544792">scripts_na</a>[orientation_id][j]) {
243
<a name="l00142"></a>00142 <a class="code" href="a00860.html#a02aa7cca2c3857c14716e8cca96ace6c">tprintf</a>(<span class="stringliteral">"%12s\t: %f\n"</span>, <a class="code" href="a00478.html#a78ebdae52f3c685095b56790598ad97c">unicharset</a>-><a class="code" href="a00642.html#a4fc0f6815e2091efedcff7ab6183d19a">get_script_from_script_id</a>(j),
244
<a name="l00143"></a>00143 <a class="code" href="a00478.html#af612cc25d8432678d5b87a5911544792">scripts_na</a>[orientation_id][j]);
245
<a name="l00144"></a>00144 }
246
<a name="l00145"></a>00145 }
247
<a name="l00146"></a>00146 }
248
<a name="l00147"></a>00147
249
<a name="l00148"></a>00148 <span class="comment">// Accumulate scores with given OSResults instance and update the best script.</span>
250
<a name="l00149"></a><a class="code" href="a00478.html#a25b4edef21699b3a367d7978733595be">00149</a> <span class="keywordtype">void</span> <a class="code" href="a00478.html#a25b4edef21699b3a367d7978733595be">OSResults::accumulate</a>(<span class="keyword">const</span> <a class="code" href="a00478.html">OSResults</a>&amp; osr) {
251
<a name="l00150"></a>00150 <span class="keywordflow">for</span> (<span class="keywordtype">int</span> i = 0; i &lt; 4; ++i) {
252
<a name="l00151"></a>00151 <a class="code" href="a00478.html#a5fe9fa97000f89cd6f4392b55638e882">orientations</a>[i] += osr.<a class="code" href="a00478.html#a5fe9fa97000f89cd6f4392b55638e882">orientations</a>[i];
253
<a name="l00152"></a>00152 <span class="keywordflow">for</span> (<span class="keywordtype">int</span> j = 0; j &lt; <a class="code" href="a00688.html#ab52d878a730b63bcf57d7bb3113882a1">kMaxNumberOfScripts</a>; ++j)
254
<a name="l00153"></a>00153 <a class="code" href="a00478.html#af612cc25d8432678d5b87a5911544792">scripts_na</a>[i][j] += osr.<a class="code" href="a00478.html#af612cc25d8432678d5b87a5911544792">scripts_na</a>[i][j];
255
<a name="l00154"></a>00154 }
256
<a name="l00155"></a>00155 <a class="code" href="a00478.html#a78ebdae52f3c685095b56790598ad97c">unicharset</a> = osr.<a class="code" href="a00478.html#a78ebdae52f3c685095b56790598ad97c">unicharset</a>;
257
<a name="l00156"></a>00156 <a class="code" href="a00478.html#af7b5cea89a2bdace52ad5825d6d5d4e6">update_best_orientation</a>();
258
<a name="l00157"></a>00157 <a class="code" href="a00478.html#ab796da60cc16d39f464c03fe4047c358">update_best_script</a>(<a class="code" href="a00478.html#a25f64011ea65c038c1ef1a6cedd10f1c">best_result</a>.<a class="code" href="a00477.html#a6dfb6826b41a81524ce867b005ba5641">orientation_id</a>);
259
<a name="l00158"></a>00158 }
260
<a name="l00159"></a>00159
261
<a name="l00160"></a>00160 <span class="comment">// Detect and erase horizontal/vertical lines and picture regions from the</span>
262
<a name="l00161"></a>00161 <span class="comment">// image, so that non-text blobs are removed from consideration.</span>
263
<a name="l00162"></a><a class="code" href="a00687.html#a0328b8314a9022034d90c11ac8a0b0ea">00162</a> <span class="keywordtype">void</span> <a class="code" href="a00687.html#a0328b8314a9022034d90c11ac8a0b0ea">remove_nontext_regions</a>(<a class="code" href="a00607.html">tesseract::Tesseract</a> *tess, BLOCK_LIST *blocks,
264
<a name="l00163"></a>00163 TO_BLOCK_LIST *to_blocks) {
265
<a name="l00164"></a>00164 Pix *pix = tess-><a class="code" href="a00607.html#a97fde2a457aa76137737b247a2418cb7">pix_binary</a>();
266
<a name="l00165"></a>00165 <a class="code" href="a00823.html#a93a603f4063a6b9403d81caa245a583b">ASSERT_HOST</a>(pix != NULL);
267
<a name="l00166"></a>00166 <span class="keywordtype">int</span> vertical_x = 0;
268
<a name="l00167"></a>00167 <span class="keywordtype">int</span> vertical_y = 1;
269
<a name="l00168"></a>00168 tesseract::TabVector_LIST v_lines;
270
<a name="l00169"></a>00169 tesseract::TabVector_LIST h_lines;
271
<a name="l00170"></a>00170 <span class="keyword">const</span> <span class="keywordtype">int</span> <a class="code" href="a00687.html#af9f4de4278c712c02788092501b587f3">kMinCredibleResolution</a> = 70;
272
<a name="l00171"></a>00171 <span class="keywordtype">int</span> resolution = (kMinCredibleResolution > pixGetXRes(pix)) ?
273
<a name="l00172"></a>00172 kMinCredibleResolution : pixGetXRes(pix);
274
<a name="l00173"></a>00173
275
<a name="l00174"></a>00174 <a class="code" href="a00451.html#a3a72521c00cb7725b2282b7b3cc6e6b9">tesseract::LineFinder::FindAndRemoveLines</a>(resolution, <span class="keyword">false</span>, pix,
276
<a name="l00175"></a>00175 &amp;vertical_x, &amp;vertical_y,
277
<a name="l00176"></a>00176 NULL, &amp;v_lines, &amp;h_lines);
278
<a name="l00177"></a>00177 Pix* im_pix = <a class="code" href="a00413.html#af465be1a567090dcaaa74eb7742c51fe">tesseract::ImageFind::FindImages</a>(pix);
279
<a name="l00178"></a>00178 <span class="keywordflow">if</span> (im_pix != NULL) {
280
<a name="l00179"></a>00179 pixSubtract(pix, pix, im_pix);
281
<a name="l00180"></a>00180 pixDestroy(&amp;im_pix);
282
<a name="l00181"></a>00181 }
283
<a name="l00182"></a>00182 tess-><a class="code" href="a00607.html#a6fa77152d6fd5c6afe14f2698413d0f9">mutable_textord</a>()-><a class="code" href="a00625.html#ab478029b49bf4efadd59a547565327a7">find_components</a>(tess-><a class="code" href="a00607.html#a97fde2a457aa76137737b247a2418cb7">pix_binary</a>(),
284
<a name="l00183"></a>00183 blocks, to_blocks);
285
<a name="l00184"></a>00184 }
286
<a name="l00185"></a>00185
287
<a name="l00186"></a>00186 <span class="comment">// Find connected components in the page and process a subset until finished or</span>
288
<a name="l00187"></a>00187 <span class="comment">// a stopping criterion is met.</span>
289
<a name="l00188"></a>00188 <span class="comment">// Returns the number of blobs used in making the estimate. 0 implies failure.</span>
290
<a name="l00189"></a><a class="code" href="a00688.html#af7ea57b0e1847f524c98576cb5cace43">00189</a> <span class="keywordtype">int</span> <a class="code" href="a00687.html#aec0e2284de8927ea9f29b61ff30d052a">orientation_and_script_detection</a>(<a class="code" href="a00557.html">STRING</a>&amp; <a class="code" href="a01266.html#a61c02c0afc996e6b9c619f0a757af50b">filename</a>,
291
<a name="l00190"></a>00190 <a class="code" href="a00478.html">OSResults</a>* osr,
292
<a name="l00191"></a>00191 <a class="code" href="a00607.html">tesseract::Tesseract</a>* tess) {
293
<a name="l00192"></a>00192 <a class="code" href="a00557.html">STRING</a> name = <a class="code" href="a01266.html#a61c02c0afc996e6b9c619f0a757af50b">filename</a>; <span class="comment">//truncated name</span>
294
<a name="l00193"></a>00193 <span class="keyword">const</span> <span class="keywordtype">char</span> *lastdot; <span class="comment">//of name</span>
295
<a name="l00194"></a>00194 <a class="code" href="a00592.html">TBOX</a> page_box;
296
<a name="l00195"></a>00195
297
<a name="l00196"></a>00196 lastdot = strrchr (name.<a class="code" href="a00557.html#a32beee43ecab1bed8bebc3466896ad6e">string</a> (), <span class="charliteral">'.'</span>);
298
<a name="l00197"></a>00197 <span class="keywordflow">if</span> (lastdot != NULL)
299
<a name="l00198"></a>00198 name[lastdot-name.<a class="code" href="a00557.html#a32beee43ecab1bed8bebc3466896ad6e">string</a>()] = <span class="charliteral">'\0'</span>;
300
<a name="l00199"></a>00199
301
<a name="l00200"></a>00200 <a class="code" href="a00823.html#a93a603f4063a6b9403d81caa245a583b">ASSERT_HOST</a>(tess-><a class="code" href="a00607.html#a97fde2a457aa76137737b247a2418cb7">pix_binary</a>() != NULL)
302
<a name="l00201"></a>00201 <span class="keywordtype">int</span> width = pixGetWidth(tess-><a class="code" href="a00607.html#a97fde2a457aa76137737b247a2418cb7">pix_binary</a>());
303
<a name="l00202"></a>00202 <span class="keywordtype">int</span> height = pixGetHeight(tess-><a class="code" href="a00607.html#a97fde2a457aa76137737b247a2418cb7">pix_binary</a>());
304
<a name="l00203"></a>00203 <span class="keywordtype">int</span> resolution = pixGetXRes(tess-><a class="code" href="a00607.html#a97fde2a457aa76137737b247a2418cb7">pix_binary</a>());
305
<a name="l00204"></a>00204 <span class="comment">// Zero resolution messes up the algorithms, so make sure it is credible.</span>
306
<a name="l00205"></a>00205 <span class="keywordflow">if</span> (resolution &lt; <a class="code" href="a00687.html#af9f4de4278c712c02788092501b587f3">kMinCredibleResolution</a>)
307
<a name="l00206"></a>00206 resolution = <a class="code" href="a00687.html#ad3674a322dd444a002052c5b929b1976">kDefaultResolution</a>;
308
<a name="l00207"></a>00207
309
<a name="l00208"></a>00208 BLOCK_LIST blocks;
310
<a name="l00209"></a>00209 <span class="keywordflow">if</span> (!<a class="code" href="a00731.html#ab65373023a95c3043ea26b7906e29907">read_unlv_file</a>(name, width, height, &amp;blocks))
311
<a name="l00210"></a>00210 <a class="code" href="a00731.html#a6d4d883ff45201c5b6166b5941cb96a2">FullPageBlock</a>(width, height, &amp;blocks);
312
<a name="l00211"></a>00211
313
<a name="l00212"></a>00212 <span class="comment">// Try to remove non-text regions from consideration.</span>
314
<a name="l00213"></a>00213 TO_BLOCK_LIST land_blocks, port_blocks;
315
<a name="l00214"></a>00214 <a class="code" href="a00687.html#a0328b8314a9022034d90c11ac8a0b0ea">remove_nontext_regions</a>(tess, &amp;blocks, &amp;port_blocks);
316
<a name="l00215"></a>00215
317
<a name="l00216"></a>00216 <span class="keywordflow">if</span> (port_blocks.empty()) {
318
<a name="l00217"></a>00217 <span class="comment">// page segmentation did not succeed, so we need to find_components first.</span>
319
<a name="l00218"></a>00218 tess-><a class="code" href="a00607.html#a6fa77152d6fd5c6afe14f2698413d0f9">mutable_textord</a>()-><a class="code" href="a00625.html#ab478029b49bf4efadd59a547565327a7">find_components</a>(tess-><a class="code" href="a00607.html#a97fde2a457aa76137737b247a2418cb7">pix_binary</a>(),
320
<a name="l00219"></a>00219 &blocks, &port_blocks);
321
<a name="l00220"></a>00220 } <span class="keywordflow">else</span> {
322
<a name="l00221"></a>00221 page_box.<a class="code" href="a00592.html#ae6151cd794841e100d8a346a0c4a46e6">set_left</a>(0);
323
<a name="l00222"></a>00222 page_box.<a class="code" href="a00592.html#a6f803b24b046883cb0f3882dc3d92302">set_bottom</a>(0);
324
<a name="l00223"></a>00223 page_box.<a class="code" href="a00592.html#a2246293d3667b28c52a52353a2d5caea">set_right</a>(width);
325
<a name="l00224"></a>00224 page_box.<a class="code" href="a00592.html#a7f40dfd290a907200bdc98c196f63f45">set_top</a>(height);
326
<a name="l00225"></a>00225 <span class="comment">// Filter_blobs sets up the TO_BLOCKs the same as find_components does.</span>
327
<a name="l00226"></a>00226 tess-><a class="code" href="a00607.html#a6fa77152d6fd5c6afe14f2698413d0f9">mutable_textord</a>()-><a class="code" href="a00625.html#acaed60ac5b5ef00751e3d307347aa0e9">filter_blobs</a>(page_box.<a class="code" href="a00592.html#a02511fc69b598b332ac1f4af6c943f8f">topright</a>(),
328
<a name="l00227"></a>00227 &port_blocks, <span class="keyword">true</span>);
329
<a name="l00228"></a>00228 }
330
<a name="l00229"></a>00229
331
<a name="l00230"></a>00230 <span class="keywordflow">return</span> <a class="code" href="a00687.html#a93fedb9cccbbcf81d3433b95bbc46bdd">os_detect</a>(&port_blocks, osr, tess);
332
<a name="l00231"></a>00231 }
333
<a name="l00232"></a>00232
334
<a name="l00233"></a>00233 <span class="comment">// Filter and sample the blobs.</span>
335
<a name="l00234"></a>00234 <span class="comment">// Returns a non-zero number of blobs if the page was successfully processed, or</span>
336
<a name="l00235"></a>00235 <span class="comment">// zero if the page had too few characters to be reliable</span>
337
<a name="l00236"></a><a class="code" href="a00688.html#a93fedb9cccbbcf81d3433b95bbc46bdd">00236</a> <span class="keywordtype">int</span> <a class="code" href="a00687.html#a93fedb9cccbbcf81d3433b95bbc46bdd">os_detect</a>(TO_BLOCK_LIST* port_blocks, <a class="code" href="a00478.html">OSResults</a>* osr,
338
<a name="l00237"></a>00237 <a class="code" href="a00607.html">tesseract::Tesseract</a>* tess) {
339
<a name="l00238"></a>00238 <span class="keywordtype">int</span> blobs_total = 0;
340
<a name="l00239"></a>00239 TO_BLOCK_IT block_it;
341
<a name="l00240"></a>00240 block_it.set_to_list(port_blocks);
342
<a name="l00241"></a>00241
343
<a name="l00242"></a>00242 BLOBNBOX_CLIST filtered_list;
344
<a name="l00243"></a>00243 BLOBNBOX_C_IT filtered_it(&filtered_list);
345
<a name="l00244"></a>00244
346
<a name="l00245"></a>00245 <span class="keywordflow">for</span> (block_it.mark_cycle_pt(); !block_it.cycled_list();
347
<a name="l00246"></a>00246 block_it.forward ()) {
348
<a name="l00247"></a>00247 <a class="code" href="a00627.html">TO_BLOCK</a>* to_block = block_it.data();
349
<a name="l00248"></a>00248 <span class="keywordflow">if</span> (to_block-><a class="code" href="a00627.html#a16e698664028b0d6d2193db64560c16b">block</a>-><a class="code" href="a00500.html#a6670779c69aca2d574e4a0590d9b3939">poly_block</a>() &&
350
<a name="l00249"></a>00249 !to_block-><a class="code" href="a00627.html#a16e698664028b0d6d2193db64560c16b">block</a>-><a class="code" href="a00500.html#a6670779c69aca2d574e4a0590d9b3939">poly_block</a>()-><a class="code" href="a00505.html#abd32dee532afe634cdbacffc0b53e660">IsText</a>()) <span class="keywordflow">continue</span>;
351
<a name="l00250"></a>00250 BLOBNBOX_IT bbox_it;
352
<a name="l00251"></a>00251 bbox_it.set_to_list(&to_block-><a class="code" href="a00627.html#a5dd67c54162a6b60b0fd11500d4a3025">blobs</a>);
353
<a name="l00252"></a>00252 <span class="keywordflow">for</span> (bbox_it.mark_cycle_pt (); !bbox_it.cycled_list ();
354
<a name="l00253"></a>00253 bbox_it.forward ()) {
355
<a name="l00254"></a>00254 <a class="code" href="a00279.html">BLOBNBOX</a>* bbox = bbox_it.data();
356
<a name="l00255"></a>00255 <a class="code" href="a00289.html">C_BLOB</a>* blob = bbox-><a class="code" href="a00279.html#a483f44541a4dd818f02225c92f030e07">cblob</a>();
357
<a name="l00256"></a>00256 <a class="code" href="a00592.html">TBOX</a> box = blob-><a class="code" href="a00289.html#a77e52e29e2c622a3a63bb7edb110f6ab">bounding_box</a>();
358
<a name="l00257"></a>00257 ++blobs_total;
359
<a name="l00258"></a>00258
360
<a name="l00259"></a>00259 <span class="keywordtype">float</span> y_x = fabs((box.<a class="code" href="a00592.html#a8379d4bbc72bdbb1f069fc14790e632d">height</a>() * 1.0) / box.<a class="code" href="a00592.html#af95494a2ccacc70cc2b83820b2948619">width</a>());
361
<a name="l00260"></a>00260 <span class="keywordtype">float</span> x_y = 1.0f / y_x;
362
<a name="l00261"></a>00261 <span class="comment">// Select a >= 1.0 ratio</span>
363
<a name="l00262"></a>00262 <span class="keywordtype">float</span> ratio = x_y > y_x ? x_y : y_x;
364
<a name="l00263"></a>00263 <span class="comment">// Blob is ambiguous</span>
365
<a name="l00264"></a>00264 <span class="keywordflow">if</span> (ratio > <a class="code" href="a00687.html#ac23eec99b25d1c109fb6ee2590a331bf">kSizeRatioToReject</a>) <span class="keywordflow">continue</span>;
366
<a name="l00265"></a>00265 <span class="keywordflow">if</span> (box.<a class="code" href="a00592.html#a8379d4bbc72bdbb1f069fc14790e632d">height</a>() < <a class="code" href="a00687.html#aaba53b59683a4788881c7b8281f25fac">kMinAcceptableBlobHeight</a>) <span class="keywordflow">continue</span>;
367
<a name="l00266"></a>00266 filtered_it.add_to_end(bbox);
368
<a name="l00267"></a>00267 }
369
<a name="l00268"></a>00268 }
370
<a name="l00269"></a>00269 <span class="keywordflow">return</span> <a class="code" href="a00687.html#a1007e747656418b79d4ce9f8f14f2a7b">os_detect_blobs</a>(&filtered_list, osr, tess);
371
<a name="l00270"></a>00270 }
372
<a name="l00271"></a>00271
373
<a name="l00272"></a>00272 <span class="comment">// Detect orientation and script from a list of blobs.</span>
374
<a name="l00273"></a>00273 <span class="comment">// Returns a non-zero number of blobs if the list was successfully processed, or</span>
375
<a name="l00274"></a>00274 <span class="comment">// zero if the list had too few characters to be reliable</span>
376
<a name="l00275"></a><a class="code" href="a00688.html#a1007e747656418b79d4ce9f8f14f2a7b">00275</a> <span class="keywordtype">int</span> <a class="code" href="a00687.html#a1007e747656418b79d4ce9f8f14f2a7b">os_detect_blobs</a>(BLOBNBOX_CLIST* blob_list, <a class="code" href="a00478.html">OSResults</a>* osr,
377
<a name="l00276"></a>00276 <a class="code" href="a00607.html">tesseract::Tesseract</a>* tess) {
378
<a name="l00277"></a>00277 <a class="code" href="a00478.html">OSResults</a> osr_;
379
<a name="l00278"></a>00278 <span class="keywordflow">if</span> (osr == NULL)
380
<a name="l00279"></a>00279 osr = &osr_;
381
<a name="l00280"></a>00280
382
<a name="l00281"></a>00281 osr-><a class="code" href="a00478.html#a78ebdae52f3c685095b56790598ad97c">unicharset</a> = &tess-><a class="code" href="a00295.html#a69c5179ac5f10a24f3f97e16ca09460f">unicharset</a>;
383
<a name="l00282"></a>00282 <a class="code" href="a00476.html">OrientationDetector</a> o(osr);
384
<a name="l00283"></a>00283 <a class="code" href="a00530.html">ScriptDetector</a> s(osr, tess);
385
<a name="l00284"></a>00284
386
<a name="l00285"></a>00285 BLOBNBOX_C_IT filtered_it(blob_list);
387
<a name="l00286"></a>00286 <span class="keywordtype">int</span> real_max = MIN(filtered_it.length(), <a class="code" href="a00687.html#ab1eb3d41a8092b2cc34e2c1d17886521">kMaxCharactersToTry</a>);
388
<a name="l00287"></a>00287 <span class="comment">// tprintf("Total blobs found = %d\n", blobs_total);</span>
389
<a name="l00288"></a>00288 <span class="comment">// tprintf("Number of blobs post-filtering = %d\n", filtered_it.length());</span>
390
<a name="l00289"></a>00289 <span class="comment">// tprintf("Number of blobs to try = %d\n", real_max);</span>
391
<a name="l00290"></a>00290
392
<a name="l00291"></a>00291 <span class="comment">// If there are too few characters, skip this page entirely.</span>
393
<a name="l00292"></a>00292 <span class="keywordflow">if</span> (real_max < <a class="code" href="a00687.html#a1dcbb4454cb6c97be113fc6ae820c958">kMinCharactersToTry</a> / 2) {
394
<a name="l00293"></a>00293 <a class="code" href="a00860.html#a02aa7cca2c3857c14716e8cca96ace6c">tprintf</a>(<span class="stringliteral">"Too few characters. Skipping this page\n"</span>);
395
<a name="l00294"></a>00294 <span class="keywordflow">return</span> 0;
396
<a name="l00295"></a>00295 }
397
<a name="l00296"></a>00296
398
<a name="l00297"></a>00297 <a class="code" href="a00279.html">BLOBNBOX</a>** blobs = <span class="keyword">new</span> <a class="code" href="a00279.html">BLOBNBOX</a>*[filtered_it.length()];
399
<a name="l00298"></a>00298 <span class="keywordtype">int</span> number_of_blobs = 0;
400
<a name="l00299"></a>00299 <span class="keywordflow">for</span> (filtered_it.mark_cycle_pt (); !filtered_it.cycled_list ();
401
<a name="l00300"></a>00300 filtered_it.forward ()) {
402
<a name="l00301"></a>00301 blobs[number_of_blobs++] = (<a class="code" href="a00279.html">BLOBNBOX</a>*)filtered_it.data();
403
<a name="l00302"></a>00302 }
404
<a name="l00303"></a>00303 <a class="code" href="a00512.html">QRSequenceGenerator</a> sequence(number_of_blobs);
405
<a name="l00304"></a>00304 <span class="keywordtype">int</span> num_blobs_evaluated = 0;
406
<a name="l00305"></a>00305 <span class="keywordflow">for</span> (<span class="keywordtype">int</span> i = 0; i < real_max; ++i) {
407
<a name="l00306"></a>00306 <span class="keywordflow">if</span> (<a class="code" href="a00687.html#a35fb2b0177ed2a774307373aeb7b13d1">os_detect_blob</a>(blobs[sequence.<a class="code" href="a00512.html#a28c125707aded762182e647e0ec91900">GetVal</a>()], &o, &s, osr, tess)
408
<a name="l00307"></a>00307 && i > <a class="code" href="a00687.html#a1dcbb4454cb6c97be113fc6ae820c958">kMinCharactersToTry</a>) {
409
<a name="l00308"></a>00308 <span class="keywordflow">break</span>;
410
<a name="l00309"></a>00309 }
411
<a name="l00310"></a>00310 ++num_blobs_evaluated;
412
<a name="l00311"></a>00311 }
413
<a name="l00312"></a>00312 <span class="keyword">delete</span> [] blobs;
414
<a name="l00313"></a>00313
415
<a name="l00314"></a>00314 <span class="comment">// Make sure the best_result is up-to-date</span>
416
<a name="l00315"></a>00315 <span class="keywordtype">int</span> orientation = o.<a class="code" href="a00476.html#a382b5269675f9db848485be62f35742e">get_orientation</a>();
417
<a name="l00316"></a>00316 osr-><a class="code" href="a00478.html#ab796da60cc16d39f464c03fe4047c358">update_best_script</a>(orientation);
418
<a name="l00317"></a>00317 <span class="keywordflow">return</span> num_blobs_evaluated;
419
<a name="l00318"></a>00318 }
420
<a name="l00319"></a>00319
421
<a name="l00320"></a>00320 <span class="comment">// Processes a single blob to estimate script and orientation.</span>
422
<a name="l00321"></a>00321 <span class="comment">// Returns true if the estimates of orientation and script satisfy the stopping</span>
423
<a name="l00322"></a>00322 <span class="comment">// criteria.</span>
424
<a name="l00323"></a><a class="code" href="a00688.html#acd67dc649eafb2a0048434366730af2e">00323</a> <span class="keywordtype">bool</span> <a class="code" href="a00687.html#a35fb2b0177ed2a774307373aeb7b13d1">os_detect_blob</a>(<a class="code" href="a00279.html">BLOBNBOX</a>* bbox, <a class="code" href="a00476.html">OrientationDetector</a>* o,
425
<a name="l00324"></a>00324 <a class="code" href="a00530.html">ScriptDetector</a>* s, <a class="code" href="a00478.html">OSResults</a>* osr,
426
<a name="l00325"></a>00325 <a class="code" href="a00607.html">tesseract::Tesseract</a>* tess) {
427
<a name="l00326"></a>00326 tess-><a class="code" href="a00314.html#a746dbbd1c99e99f3d213077cceedf80e">tess_cn_matching</a>.set_value(<span class="keyword">true</span>); <span class="comment">// turn it on</span>
428
<a name="l00327"></a>00327 tess-><a class="code" href="a00314.html#a85fcc9966cddbc38adf1014dd0cd778c">tess_bn_matching</a>.set_value(<span class="keyword">false</span>);
429
<a name="l00328"></a>00328 <a class="code" href="a00289.html">C_BLOB</a>* blob = bbox-><a class="code" href="a00279.html#a483f44541a4dd818f02225c92f030e07">cblob</a>();
430
<a name="l00329"></a>00329 <a class="code" href="a00591.html">TBLOB</a>* tblob = <a class="code" href="a00591.html#a7b6051e1c1934265a91e1ee864bd5164">TBLOB::PolygonalCopy</a>(tess-><a class="code" href="a00607.html#ae1206c0c4b63a008cc01650004fb7b03">poly_allow_detailed_fx</a>, blob);
431
<a name="l00330"></a>00330 <a class="code" href="a00592.html">TBOX</a> box = tblob-><a class="code" href="a00591.html#a8f1f8f110170fe12cf8147d504cd0ea2">bounding_box</a>();
432
<a name="l00331"></a>00331 <a class="code" href="a00375.html">FCOORD</a> current_rotation(1.0f, 0.0f);
433
<a name="l00332"></a>00332 <a class="code" href="a00375.html">FCOORD</a> rotation90(0.0f, 1.0f);
434
<a name="l00333"></a>00333 BLOB_CHOICE_LIST ratings[4];
435
<a name="l00334"></a>00334 <span class="comment">// Test the 4 orientations</span>
436
<a name="l00335"></a>00335 <span class="keywordflow">for</span> (<span class="keywordtype">int</span> i = 0; i < 4; ++i) {
437
<a name="l00336"></a>00336 <span class="comment">// Normalize the blob. Set the origin to the place we want to be the</span>
438
<a name="l00337"></a>00337 <span class="comment">// bottom-middle after rotation.</span>
439
<a name="l00338"></a>00338 <span class="comment">// Scaling is to make the rotated height the x-height.</span>
440
<a name="l00339"></a>00339 <span class="keywordtype">float</span> scaling = <span class="keyword">static_cast<</span><span class="keywordtype">float</span><span class="keyword">></span>(<a class="code" href="a00759.html#af974e6755e636c8bc7cbe57e3bcbdd73">kBlnXHeight</a>) / box.<a class="code" href="a00592.html#a8379d4bbc72bdbb1f069fc14790e632d">height</a>();
441
<a name="l00340"></a>00340 <span class="keywordtype">float</span> x_origin = (box.<a class="code" href="a00592.html#a724fabf566586b663577dfa944ffbc61">left</a>() + box.<a class="code" href="a00592.html#a8703081c1a1c26db3a4dddaca1028e34">right</a>()) / 2.0f;
442
<a name="l00341"></a>00341 <span class="keywordtype">float</span> y_origin = (box.<a class="code" href="a00592.html#a4451d237f1cd18c4982d63fe36a11fc3">bottom</a>() + box.<a class="code" href="a00592.html#adf92e9fdac1bdf11c10d1c4d1178791a">top</a>()) / 2.0f;
443
<a name="l00342"></a>00342 <span class="keywordflow">if</span> (i == 0 || i == 2) {
444
<a name="l00343"></a>00343 <span class="comment">// Rotation is 0 or 180.</span>
445
<a name="l00344"></a>00344 y_origin = i == 0 ? box.<a class="code" href="a00592.html#a4451d237f1cd18c4982d63fe36a11fc3">bottom</a>() : box.<a class="code" href="a00592.html#adf92e9fdac1bdf11c10d1c4d1178791a">top</a>();
446
<a name="l00345"></a>00345 } <span class="keywordflow">else</span> {
447
<a name="l00346"></a>00346 <span class="comment">// Rotation is 90 or 270.</span>
448
<a name="l00347"></a>00347 scaling = <span class="keyword">static_cast<</span><span class="keywordtype">float</span><span class="keyword">></span>(<a class="code" href="a00759.html#af974e6755e636c8bc7cbe57e3bcbdd73">kBlnXHeight</a>) / box.<a class="code" href="a00592.html#af95494a2ccacc70cc2b83820b2948619">width</a>();
449
<a name="l00348"></a>00348 x_origin = i == 1 ? box.<a class="code" href="a00592.html#a724fabf566586b663577dfa944ffbc61">left</a>() : box.<a class="code" href="a00592.html#a8703081c1a1c26db3a4dddaca1028e34">right</a>();
450
<a name="l00349"></a>00349 }
451
<a name="l00350"></a>00350 <a class="code" href="a00591.html">TBLOB</a>* rotated_blob = <span class="keyword">new</span> <a class="code" href="a00591.html">TBLOB</a>(*tblob);
452
<a name="l00351"></a>00351 rotated_blob-><a class="code" href="a00591.html#a6aef0201c756ed33e68a94abc8ac2b8e">Normalize</a>(NULL, &current_rotation, NULL,
453
<a name="l00352"></a>00352 x_origin, y_origin, scaling, scaling,
454
<a name="l00353"></a>00353 0.0f, static_cast<float>(<a class="code" href="a00759.html#abe10ce41bf7240ae8a053dea471d6ed5">kBlnBaselineOffset</a>),
455
<a name="l00354"></a>00354 <span class="keyword">false</span>, NULL);
456
<a name="l00355"></a>00355 tess-><a class="code" href="a00314.html#ab39a42222f621c9a5f1bd1b31db3a930">AdaptiveClassifier</a>(rotated_blob, ratings + i);
457
<a name="l00356"></a>00356 <span class="keyword">delete</span> rotated_blob;
458
<a name="l00357"></a>00357 current_rotation.<a class="code" href="a00375.html#a81ca9ea0cac4cd8c1bca0314e29bb28d">rotate</a>(rotation90);
459
<a name="l00358"></a>00358 }
460
<a name="l00359"></a>00359 <span class="keyword">delete</span> tblob;
461
<a name="l00360"></a>00360
462
<a name="l00361"></a>00361 <span class="keywordtype">bool</span> stop = o-><a class="code" href="a00476.html#a7f3ad682712b5ff3bfcecca0a8a5b086">detect_blob</a>(ratings);
463
<a name="l00362"></a>00362 s-><a class="code" href="a00530.html#aa1626a91138960515d479a781a6b97ca">detect_blob</a>(ratings);
464
<a name="l00363"></a>00363 <span class="keywordtype">int</span> orientation = o-><a class="code" href="a00476.html#a382b5269675f9db848485be62f35742e">get_orientation</a>();
465
<a name="l00364"></a>00364 stop = s-><a class="code" href="a00530.html#a951bd4d3f5b14ee234d20afc91d44585">must_stop</a>(orientation) && stop;
466
<a name="l00365"></a>00365 <span class="keywordflow">return</span> stop;
467
<a name="l00366"></a>00366 }
468
<a name="l00367"></a>00367
469
<a name="l00368"></a>00368
470
<a name="l00369"></a><a class="code" href="a00476.html#aa00a93a069267a2636ec74f4ebb11095">00369</a> <a class="code" href="a00476.html#aa00a93a069267a2636ec74f4ebb11095">OrientationDetector::OrientationDetector</a>(<a class="code" href="a00478.html">OSResults</a>* osr) {
471
<a name="l00370"></a>00370 osr_ = osr;
472
<a name="l00371"></a>00371 }
473
<a name="l00372"></a>00372
474
<a name="l00373"></a>00373 <span class="comment">// Score the given blob and return true if it is now sure of the orientation</span>
475
<a name="l00374"></a>00374 <span class="comment">// after adding this blob.</span>
476
<a name="l00375"></a><a class="code" href="a00476.html#a7f3ad682712b5ff3bfcecca0a8a5b086">00375</a> <span class="keywordtype">bool</span> <a class="code" href="a00476.html#a7f3ad682712b5ff3bfcecca0a8a5b086">OrientationDetector::detect_blob</a>(BLOB_CHOICE_LIST* scores) {
477
<a name="l00376"></a>00376 <span class="keywordtype">float</span> blob_o_score[4] = {0.0, 0.0, 0.0, 0.0};
478
<a name="l00377"></a>00377 <span class="keywordtype">float</span> total_blob_o_score = 0.0;
479
<a name="l00378"></a>00378
480
<a name="l00379"></a>00379 <span class="keywordflow">for</span> (<span class="keywordtype">int</span> i = 0; i < 4; ++i) {
481
<a name="l00380"></a>00380 BLOB_CHOICE_IT choice_it;
482
<a name="l00381"></a>00381 choice_it.set_to_list(scores + i);
483
<a name="l00382"></a>00382 <span class="keywordflow">if</span> (!choice_it.empty()) {
484
<a name="l00383"></a>00383 <span class="comment">// The certainty score ranges between [-20,0]. This is converted here to</span>
485
<a name="l00384"></a>00384 <span class="comment">// [0,1], with 1 indicating best match.</span>
486
<a name="l00385"></a>00385 blob_o_score[i] = 1 + 0.05 * choice_it.data()->certainty();
487
<a name="l00386"></a>00386 total_blob_o_score += blob_o_score[i];
488
<a name="l00387"></a>00387 }
489
<a name="l00388"></a>00388 }
490
<a name="l00389"></a>00389 <span class="comment">// Normalize the orientation scores for the blob and use them to</span>
491
<a name="l00390"></a>00390 <span class="comment">// update the aggregated orientation score.</span>
492
<a name="l00391"></a>00391 <span class="keywordflow">for</span> (<span class="keywordtype">int</span> i = 0; total_blob_o_score != 0 && i < 4; ++i) {
493
<a name="l00392"></a>00392 osr_-><a class="code" href="a00478.html#a5fe9fa97000f89cd6f4392b55638e882">orientations</a>[i] += log(blob_o_score[i] / total_blob_o_score);
494
<a name="l00393"></a>00393 }
495
<a name="l00394"></a>00394
496
<a name="l00395"></a>00395 <span class="keywordtype">float</span> first = -1;
497
<a name="l00396"></a>00396 <span class="keywordtype">float</span> second = -1;
498
<a name="l00397"></a>00397
499
<a name="l00398"></a>00398 <span class="keywordflow">for</span> (<span class="keywordtype">int</span> i = 0; i < 4; ++i) {
500
<a name="l00399"></a>00399 <span class="keywordflow">if</span> (osr_-><a class="code" href="a00478.html#a5fe9fa97000f89cd6f4392b55638e882">orientations</a>[i] > first) {
501
<a name="l00400"></a>00400 second = first;
502
<a name="l00401"></a>00401 first = osr_-><a class="code" href="a00478.html#a5fe9fa97000f89cd6f4392b55638e882">orientations</a>[i];
503
<a name="l00402"></a>00402 } <span class="keywordflow">else</span> <span class="keywordflow">if</span> (osr_-><a class="code" href="a00478.html#a5fe9fa97000f89cd6f4392b55638e882">orientations</a>[i] > second) {
504
<a name="l00403"></a>00403 second = osr_-><a class="code" href="a00478.html#a5fe9fa97000f89cd6f4392b55638e882">orientations</a>[i];
505
<a name="l00404"></a>00404 }
506
<a name="l00405"></a>00405 }
507
<a name="l00406"></a>00406
508
<a name="l00407"></a>00407 <span class="keywordflow">return</span> first / second > <a class="code" href="a00687.html#ad58ecd1e0aa2241ba3ccd5d0398c1e5c">kOrientationAcceptRatio</a>;
509
<a name="l00408"></a>00408 }
510
<a name="l00409"></a>00409
511
<a name="l00410"></a><a class="code" href="a00476.html#a382b5269675f9db848485be62f35742e">00410</a> <span class="keywordtype">int</span> <a class="code" href="a00476.html#a382b5269675f9db848485be62f35742e">OrientationDetector::get_orientation</a>() {
512
<a name="l00411"></a>00411 osr_-><a class="code" href="a00478.html#af7b5cea89a2bdace52ad5825d6d5d4e6">update_best_orientation</a>();
513
<a name="l00412"></a>00412 <span class="keywordflow">return</span> osr_-><a class="code" href="a00478.html#a25f64011ea65c038c1ef1a6cedd10f1c">best_result</a>.<a class="code" href="a00477.html#a6dfb6826b41a81524ce867b005ba5641">orientation_id</a>;
514
<a name="l00413"></a>00413 }
515
<a name="l00414"></a>00414
516
<a name="l00415"></a>00415
517
<a name="l00416"></a><a class="code" href="a00530.html#ac44d1acf5214aecb8437e160e30db1d4">00416</a> <a class="code" href="a00530.html#ac44d1acf5214aecb8437e160e30db1d4">ScriptDetector::ScriptDetector</a>(<a class="code" href="a00478.html">OSResults</a>* osr, <a class="code" href="a00607.html">tesseract::Tesseract</a>* tess) {
518
<a name="l00417"></a>00417 osr_ = osr;
519
<a name="l00418"></a>00418 tess_ = tess;
520
<a name="l00419"></a>00419 katakana_id_ = tess_-><a class="code" href="a00295.html#a69c5179ac5f10a24f3f97e16ca09460f">unicharset</a>.<a class="code" href="a00642.html#a7cbfd800fe71082f0e7d58b7c25330bb">add_script</a>(katakana_script);
521
<a name="l00420"></a>00420 hiragana_id_ = tess_-><a class="code" href="a00295.html#a69c5179ac5f10a24f3f97e16ca09460f">unicharset</a>.<a class="code" href="a00642.html#a7cbfd800fe71082f0e7d58b7c25330bb">add_script</a>(hiragana_script);
522
<a name="l00421"></a>00421 han_id_ = tess_-><a class="code" href="a00295.html#a69c5179ac5f10a24f3f97e16ca09460f">unicharset</a>.<a class="code" href="a00642.html#a7cbfd800fe71082f0e7d58b7c25330bb">add_script</a>(han_script);
523
<a name="l00422"></a>00422 hangul_id_ = tess_-><a class="code" href="a00295.html#a69c5179ac5f10a24f3f97e16ca09460f">unicharset</a>.<a class="code" href="a00642.html#a7cbfd800fe71082f0e7d58b7c25330bb">add_script</a>(hangul_script);
524
<a name="l00423"></a>00423 japanese_id_ = tess_-><a class="code" href="a00295.html#a69c5179ac5f10a24f3f97e16ca09460f">unicharset</a>.<a class="code" href="a00642.html#a7cbfd800fe71082f0e7d58b7c25330bb">add_script</a>(japanese_script_);
525
<a name="l00424"></a>00424 korean_id_ = tess_-><a class="code" href="a00295.html#a69c5179ac5f10a24f3f97e16ca09460f">unicharset</a>.<a class="code" href="a00642.html#a7cbfd800fe71082f0e7d58b7c25330bb">add_script</a>(korean_script_);
526
<a name="l00425"></a>00425 latin_id_ = tess_-><a class="code" href="a00295.html#a69c5179ac5f10a24f3f97e16ca09460f">unicharset</a>.<a class="code" href="a00642.html#a7cbfd800fe71082f0e7d58b7c25330bb">add_script</a>(latin_script);
527
<a name="l00426"></a>00426 fraktur_id_ = tess_-><a class="code" href="a00295.html#a69c5179ac5f10a24f3f97e16ca09460f">unicharset</a>.<a class="code" href="a00642.html#a7cbfd800fe71082f0e7d58b7c25330bb">add_script</a>(fraktur_script_);
528
<a name="l00427"></a>00427 }
529
<a name="l00428"></a>00428
530
<a name="l00429"></a>00429
531
<a name="l00430"></a>00430 <span class="comment">// Score the given blob and update the per-orientation script scores. Returns</span>
531
<a name="l00431"></a>00431 <span class="comment">// nothing; call must_stop() to test the stopping criteria after adding this blob.</span>
533
<a name="l00432"></a><a class="code" href="a00530.html#aa1626a91138960515d479a781a6b97ca">00432</a> <span class="keywordtype">void</span> <a class="code" href="a00530.html#aa1626a91138960515d479a781a6b97ca">ScriptDetector::detect_blob</a>(BLOB_CHOICE_LIST* scores) {
534
<a name="l00433"></a>00433 <span class="keywordtype">bool</span> done[<a class="code" href="a00688.html#ab52d878a730b63bcf57d7bb3113882a1">kMaxNumberOfScripts</a>];
535
<a name="l00434"></a>00434 <span class="keywordflow">for</span> (<span class="keywordtype">int</span> i = 0; i < 4; ++i) {
536
<a name="l00435"></a>00435 <span class="keywordflow">for</span> (<span class="keywordtype">int</span> j = 0; j < <a class="code" href="a00688.html#ab52d878a730b63bcf57d7bb3113882a1">kMaxNumberOfScripts</a>; ++j)
537
<a name="l00436"></a>00436 done[j] = <span class="keyword">false</span>;
538
<a name="l00437"></a>00437
539
<a name="l00438"></a>00438 BLOB_CHOICE_IT choice_it;
540
<a name="l00439"></a>00439 choice_it.set_to_list(scores + i);
541
<a name="l00440"></a>00440
542
<a name="l00441"></a>00441 <span class="keywordtype">float</span> prev_score = -1;
543
<a name="l00442"></a>00442 <span class="keywordtype">int</span> script_count = 0;
544
<a name="l00443"></a>00443 <span class="keywordtype">int</span> prev_id = -1;
545
<a name="l00444"></a>00444 <span class="keywordtype">int</span> prev_fontinfo_id = -1;
546
<a name="l00445"></a>00445 <span class="keyword">const</span> <span class="keywordtype">char</span>* prev_unichar = <span class="stringliteral">""</span>;
547
<a name="l00446"></a>00446 <span class="keyword">const</span> <span class="keywordtype">char</span>* unichar = <span class="stringliteral">""</span>;
548
<a name="l00447"></a>00447
549
<a name="l00448"></a>00448 <span class="keywordflow">for</span> (choice_it.mark_cycle_pt(); !choice_it.cycled_list();
550
<a name="l00449"></a>00449 choice_it.forward()) {
551
<a name="l00450"></a>00450 <a class="code" href="a00276.html">BLOB_CHOICE</a>* choice = choice_it.data();
552
<a name="l00451"></a>00451 <span class="keywordtype">int</span> <span class="keywordtype">id</span> = choice-><a class="code" href="a00276.html#a746d149d149ec75e4bea96f338b48433">script_id</a>();
553
<a name="l00452"></a>00452 <span class="comment">// Script already processed before.</span>
554
<a name="l00453"></a>00453 <span class="keywordflow">if</span> (done[<span class="keywordtype">id</span>]) <span class="keywordflow">continue</span>;
555
<a name="l00454"></a>00454 done[id] = <span class="keyword">true</span>;
556
<a name="l00455"></a>00455
557
<a name="l00456"></a>00456 unichar = tess_-><a class="code" href="a00295.html#a69c5179ac5f10a24f3f97e16ca09460f">unicharset</a>.<a class="code" href="a00642.html#a421c0b6ebcbbe7547490252fb688c961">id_to_unichar</a>(choice-><a class="code" href="a00276.html#aaba6190b77c5f3dc21905fc4118afa94">unichar_id</a>());
558
<a name="l00457"></a>00457 <span class="comment">// Save data from the first match</span>
559
<a name="l00458"></a>00458 <span class="keywordflow">if</span> (prev_score < 0) {
560
<a name="l00459"></a>00459 prev_score = -choice-><a class="code" href="a00276.html#af53d45b718c562ea7209b583c77ac14e">certainty</a>();
561
<a name="l00460"></a>00460 script_count = 1;
562
<a name="l00461"></a>00461 prev_id = id;
563
<a name="l00462"></a>00462 prev_unichar = unichar;
564
<a name="l00463"></a>00463 prev_fontinfo_id = choice-><a class="code" href="a00276.html#a3594e34861be86d775724f5f91fba3be">fontinfo_id</a>();
565
<a name="l00464"></a>00464 } <span class="keywordflow">else</span> <span class="keywordflow">if</span> (-choice-><a class="code" href="a00276.html#af53d45b718c562ea7209b583c77ac14e">certainty</a>() < prev_score + <a class="code" href="a00687.html#a14c7913eafbd3237afbdd7c6b498b2d8">kNonAmbiguousMargin</a>) {
566
<a name="l00465"></a>00465 ++script_count;
567
<a name="l00466"></a>00466 }
568
<a name="l00467"></a>00467
569
<a name="l00468"></a>00468 <span class="keywordflow">if</span> (strlen(prev_unichar) == 1)
570
<a name="l00469"></a>00469 <span class="keywordflow">if</span> (unichar[0] >= <span class="charliteral">'0'</span> && unichar[0] <= <span class="charliteral">'9'</span>)
571
<a name="l00470"></a>00470 <span class="keywordflow">break</span>;
572
<a name="l00471"></a>00471
573
<a name="l00472"></a>00472 <span class="comment">// if script_count is >= 2, character is ambiguous, skip other matches</span>
574
<a name="l00473"></a>00473 <span class="comment">// since they are useless.</span>
575
<a name="l00474"></a>00474 <span class="keywordflow">if</span> (script_count >= 2)
576
<a name="l00475"></a>00475 <span class="keywordflow">break</span>;
577
<a name="l00476"></a>00476 }
578
<a name="l00477"></a>00477 <span class="comment">// Character is unambiguous</span>
579
<a name="l00478"></a>00478 <span class="keywordflow">if</span> (script_count == 1) {
580
<a name="l00479"></a>00479 <span class="comment">// Update the score of the winning script</span>
581
<a name="l00480"></a>00480 osr_-><a class="code" href="a00478.html#af612cc25d8432678d5b87a5911544792">scripts_na</a>[i][prev_id] += 1.0;
582
<a name="l00481"></a>00481
583
<a name="l00482"></a>00482 <span class="comment">// Workaround for Fraktur</span>
584
<a name="l00483"></a>00483 <span class="keywordflow">if</span> (prev_id == latin_id_) {
585
<a name="l00484"></a>00484 <span class="keywordflow">if</span> (prev_fontinfo_id >= 0) {
586
<a name="l00485"></a>00485 <span class="keyword">const</span> <a class="code" href="a00389.html">tesseract::FontInfo</a> &fi =
587
<a name="l00486"></a>00486 tess_-><a class="code" href="a00314.html#a62597f182a5e23c3b8a030c06e699e99">get_fontinfo_table</a>().<a class="code" href="a00643.html#a3b3107bc72d9edfe501eaba7404de7eb" title="Return the object from an id.">get</a>(prev_fontinfo_id);
588
<a name="l00487"></a>00487 <span class="comment">//printf("Font: %s i:%i b:%i f:%i s:%i k:%i (%s)\n", fi.name,</span>
589
<a name="l00488"></a>00488 <span class="comment">// fi.is_italic(), fi.is_bold(), fi.is_fixed_pitch(),</span>
590
<a name="l00489"></a>00489 <span class="comment">// fi.is_serif(), fi.is_fraktur(),</span>
591
<a name="l00490"></a>00490 <span class="comment">// prev_unichar);</span>
592
<a name="l00491"></a>00491 <span class="keywordflow">if</span> (fi.<a class="code" href="a00389.html#a5a918bad85fde70770f60853355c1716">is_fraktur</a>()) {
593
<a name="l00492"></a>00492 osr_-><a class="code" href="a00478.html#af612cc25d8432678d5b87a5911544792">scripts_na</a>[i][prev_id] -= 1.0;
594
<a name="l00493"></a>00493 osr_-><a class="code" href="a00478.html#af612cc25d8432678d5b87a5911544792">scripts_na</a>[i][fraktur_id_] += 1.0;
595
<a name="l00494"></a>00494 }
596
<a name="l00495"></a>00495 }
597
<a name="l00496"></a>00496 }
598
<a name="l00497"></a>00497
599
<a name="l00498"></a>00498 <span class="comment">// Update Japanese / Korean pseudo-scripts</span>
600
<a name="l00499"></a>00499 <span class="keywordflow">if</span> (prev_id == katakana_id_)
601
<a name="l00500"></a>00500 osr_-><a class="code" href="a00478.html#af612cc25d8432678d5b87a5911544792">scripts_na</a>[i][japanese_id_] += 1.0;
602
<a name="l00501"></a>00501 <span class="keywordflow">if</span> (prev_id == hiragana_id_)
603
<a name="l00502"></a>00502 osr_-><a class="code" href="a00478.html#af612cc25d8432678d5b87a5911544792">scripts_na</a>[i][japanese_id_] += 1.0;
604
<a name="l00503"></a>00503 <span class="keywordflow">if</span> (prev_id == hangul_id_)
605
<a name="l00504"></a>00504 osr_-><a class="code" href="a00478.html#af612cc25d8432678d5b87a5911544792">scripts_na</a>[i][korean_id_] += 1.0;
606
<a name="l00505"></a>00505 <span class="keywordflow">if</span> (prev_id == han_id_)
607
<a name="l00506"></a>00506 osr_-><a class="code" href="a00478.html#af612cc25d8432678d5b87a5911544792">scripts_na</a>[i][korean_id_] += <a class="code" href="a00687.html#ae3f12edb58f6ed0a11daea2cbf8dc547">kHanRatioInKorean</a>;
608
<a name="l00507"></a>00507 <span class="keywordflow">if</span> (prev_id == han_id_)
609
<a name="l00508"></a>00508 osr_-><a class="code" href="a00478.html#af612cc25d8432678d5b87a5911544792">scripts_na</a>[i][japanese_id_] += <a class="code" href="a00687.html#aab3b7e76eea520b1e4b9d68165e3a094">kHanRatioInJapanese</a>;
610
<a name="l00509"></a>00509 }
611
<a name="l00510"></a>00510 } <span class="comment">// iterate over each orientation</span>
612
<a name="l00511"></a>00511 }
613
<a name="l00512"></a>00512
614
<a name="l00513"></a><a class="code" href="a00530.html#a951bd4d3f5b14ee234d20afc91d44585">00513</a> <span class="keywordtype">bool</span> <a class="code" href="a00530.html#a951bd4d3f5b14ee234d20afc91d44585">ScriptDetector::must_stop</a>(<span class="keywordtype">int</span> orientation) {
615
<a name="l00514"></a>00514 osr_-><a class="code" href="a00478.html#ab796da60cc16d39f464c03fe4047c358">update_best_script</a>(orientation);
616
<a name="l00515"></a>00515 <span class="keywordflow">return</span> osr_-><a class="code" href="a00478.html#a25f64011ea65c038c1ef1a6cedd10f1c">best_result</a>.<a class="code" href="a00477.html#ae39a2c718b010ed27eb7f820546da6d6">sconfidence</a> > 1;
617
<a name="l00516"></a>00516 }
618
<a name="l00517"></a>00517
619
<a name="l00518"></a>00518 <span class="comment">// Helper method to convert an orientation index to its value in degrees.</span>
620
<a name="l00519"></a>00519 <span class="comment">// The value represents the amount of clockwise rotation in degrees that must be</span>
621
<a name="l00520"></a>00520 <span class="comment">// applied for the text to be upright (readable).</span>
622
<a name="l00521"></a><a class="code" href="a00688.html#a4239adc5aad0a7487a6d414f91fc41b2">00521</a> <span class="keyword">const</span> <span class="keywordtype">int</span> <a class="code" href="a00687.html#a94d19668c76dab0d8ab3832c765303da">OrientationIdToValue</a>(<span class="keyword">const</span> <span class="keywordtype">int</span>&amp; <span class="keywordtype">id</span>) {
623
<a name="l00522"></a>00522 <span class="keywordflow">switch</span> (<span class="keywordtype">id</span>) {
624
<a name="l00523"></a>00523 <span class="keywordflow">case</span> 0:
625
<a name="l00524"></a>00524 <span class="keywordflow">return</span> 0;
626
<a name="l00525"></a>00525 <span class="keywordflow">case</span> 1:
627
<a name="l00526"></a>00526 <span class="keywordflow">return</span> 270;
628
<a name="l00527"></a>00527 <span class="keywordflow">case</span> 2:
629
<a name="l00528"></a>00528 <span class="keywordflow">return</span> 180;
630
<a name="l00529"></a>00529 <span class="keywordflow">case</span> 3:
631
<a name="l00530"></a>00530 <span class="keywordflow">return</span> 90;
632
<a name="l00531"></a>00531 <span class="keywordflow">default</span>:
633
<a name="l00532"></a>00532 <span class="keywordflow">return</span> -1;
634
<a name="l00533"></a>00533 }
635
<a name="l00534"></a>00534 }
636
</pre></div></div><!-- contents -->
638
<!-- window showing the filter options -->
639
<div id="MSearchSelectWindow"
640
onmouseover="return searchBox.OnSearchSelectShow()"
641
onmouseout="return searchBox.OnSearchSelectHide()"
642
onkeydown="return searchBox.OnSearchSelectKey(event)">
643
<a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(0)"><span class="SelectionMark"> </span>All</a><a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(1)"><span class="SelectionMark"> </span>Classes</a><a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(2)"><span class="SelectionMark"> </span>Namespaces</a><a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(3)"><span class="SelectionMark"> </span>Files</a><a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(4)"><span class="SelectionMark"> </span>Functions</a><a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(5)"><span class="SelectionMark"> </span>Variables</a><a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(6)"><span class="SelectionMark"> </span>Typedefs</a><a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(7)"><span class="SelectionMark"> </span>Enumerations</a><a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(8)"><span class="SelectionMark"> </span>Enumerator</a><a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(9)"><span class="SelectionMark"> </span>Friends</a><a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(10)"><span class="SelectionMark"> </span>Defines</a></div>
645
<!-- iframe showing the search results (closed by default) -->
646
<div id="MSearchResultsWindow">
647
<iframe src="javascript:void(0)" frameborder="0" title="Search results"
648
name="MSearchResults" id="MSearchResults">
652
<div id="nav-path" class="navpath">
654
<li class="navelem"><a class="el" href="a00687.html">osdetect.cpp</a> </li>
656
<li class="footer">Generated on Mon Feb 3 2014 10:59:07 for tesseract by
657
<a href="http://www.doxygen.org/index.html">
658
<img class="footer" src="doxygen.png" alt="doxygen"/></a> 1.7.6.1 </li>