~ubuntu-branches/ubuntu/vivid/tesseract/vivid

« back to all changes in this revision

Viewing changes to doc/html/a01106_source.html

  • Committer: Package Import Robot
  • Author(s): Jeff Breidenbach
  • Date: 2014-02-03 11:10:20 UTC
  • mfrom: (1.3.1) (19.1.1 experimental)
  • Revision ID: package-import@ubuntu.com-20140203111020-igquodd7pjlp3uri
Tags: 3.03.01-1
* New upstream release, includes critical fix to PDF rendering
* Complete leptonlib transition (see bug #735509)
* Promote from experimental to unstable

Show diffs side-by-side

added added

removed removed

Lines of Context:
 
1
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
 
2
<html xmlns="http://www.w3.org/1999/xhtml">
 
3
<head>
 
4
<meta http-equiv="Content-Type" content="text/xhtml;charset=UTF-8"/>
 
5
<meta http-equiv="X-UA-Compatible" content="IE=9"/>
 
6
<title>tesseract: /usr/local/google/home/jbreiden/tesseract-ocr-read-only/textord/devanagari_processing.cpp Source File</title>
 
7
 
 
8
<link href="tabs.css" rel="stylesheet" type="text/css"/>
 
9
<link href="doxygen.css" rel="stylesheet" type="text/css" />
 
10
<link href="navtree.css" rel="stylesheet" type="text/css"/>
 
11
<script type="text/javascript" src="jquery.js"></script>
 
12
<script type="text/javascript" src="resize.js"></script>
 
13
<script type="text/javascript" src="navtree.js"></script>
 
14
<script type="text/javascript">
 
15
  $(document).ready(initResizable);
 
16
</script>
 
17
<link href="search/search.css" rel="stylesheet" type="text/css"/>
 
18
<script type="text/javascript" src="search/search.js"></script>
 
19
<script type="text/javascript">
 
20
  $(document).ready(function() { searchBox.OnSelectItem(0); });
 
21
</script>
 
22
 
 
23
</head>
 
24
<body>
 
25
<div id="top"><!-- do not remove this div! -->
 
26
 
 
27
 
 
28
<div id="titlearea">
 
29
<table cellspacing="0" cellpadding="0">
 
30
 <tbody>
 
31
 <tr style="height: 56px;">
 
32
  
 
33
  
 
34
  <td style="padding-left: 0.5em;">
 
35
   <div id="projectname">tesseract
 
36
   &#160;<span id="projectnumber">3.03</span>
 
37
   </div>
 
38
   
 
39
  </td>
 
40
  
 
41
  
 
42
  
 
43
 </tr>
 
44
 </tbody>
 
45
</table>
 
46
</div>
 
47
 
 
48
<!-- Generated by Doxygen 1.7.6.1 -->
 
49
<script type="text/javascript">
 
50
var searchBox = new SearchBox("searchBox", "search",false,'Search');
 
51
</script>
 
52
  <div id="navrow1" class="tabs">
 
53
    <ul class="tablist">
 
54
      <li><a href="index.html"><span>Main&#160;Page</span></a></li>
 
55
      <li><a href="pages.html"><span>Related&#160;Pages</span></a></li>
 
56
      <li><a href="modules.html"><span>Modules</span></a></li>
 
57
      <li><a href="namespaces.html"><span>Namespaces</span></a></li>
 
58
      <li><a href="annotated.html"><span>Classes</span></a></li>
 
59
      <li class="current"><a href="files.html"><span>Files</span></a></li>
 
60
      <li>
 
61
        <div id="MSearchBox" class="MSearchBoxInactive">
 
62
        <span class="left">
 
63
          <img id="MSearchSelect" src="search/mag_sel.png"
 
64
               onmouseover="return searchBox.OnSearchSelectShow()"
 
65
               onmouseout="return searchBox.OnSearchSelectHide()"
 
66
               alt=""/>
 
67
          <input type="text" id="MSearchField" value="Search" accesskey="S"
 
68
               onfocus="searchBox.OnSearchFieldFocus(true)" 
 
69
               onblur="searchBox.OnSearchFieldFocus(false)" 
 
70
               onkeyup="searchBox.OnSearchFieldChange(event)"/>
 
71
          </span><span class="right">
 
72
            <a id="MSearchClose" href="javascript:searchBox.CloseResultsWindow()"><img id="MSearchCloseImg" border="0" src="search/close.png" alt=""/></a>
 
73
          </span>
 
74
        </div>
 
75
      </li>
 
76
    </ul>
 
77
  </div>
 
78
  <div id="navrow2" class="tabs2">
 
79
    <ul class="tablist">
 
80
      <li><a href="files.html"><span>File&#160;List</span></a></li>
 
81
      <li><a href="globals.html"><span>File&#160;Members</span></a></li>
 
82
    </ul>
 
83
  </div>
 
84
</div>
 
85
<div id="side-nav" class="ui-resizable side-nav-resizable">
 
86
  <div id="nav-tree">
 
87
    <div id="nav-tree-contents">
 
88
    </div>
 
89
  </div>
 
90
  <div id="splitbar" style="-moz-user-select:none;" 
 
91
       class="ui-resizable-handle">
 
92
  </div>
 
93
</div>
 
94
<script type="text/javascript">
 
95
  initNavTree('a01106.html','');
 
96
</script>
 
97
<div id="doc-content">
 
98
<div class="header">
 
99
  <div class="headertitle">
 
100
<div class="title">/usr/local/google/home/jbreiden/tesseract-ocr-read-only/textord/devanagari_processing.cpp</div>  </div>
 
101
</div><!--header-->
 
102
<div class="contents">
 
103
<a href="a01106.html">Go to the documentation of this file.</a><div class="fragment"><pre class="fragment"><a name="l00001"></a>00001 <span class="comment">/**********************************************************************</span>
 
104
<a name="l00002"></a>00002 <span class="comment"> * File:        devanagari_processing.cpp</span>
 
105
<a name="l00003"></a>00003 <span class="comment"> * Description: Methods to process images containing devanagari symbols,</span>
 
106
<a name="l00004"></a>00004 <span class="comment"> *              prior to classification.</span>
 
107
<a name="l00005"></a>00005 <span class="comment"> * Author:      Shobhit Saxena</span>
 
108
<a name="l00006"></a>00006 <span class="comment"> * Created:     Mon Nov 17 20:26:01 IST 2008</span>
 
109
<a name="l00007"></a>00007 <span class="comment"> *</span>
 
110
<a name="l00008"></a>00008 <span class="comment"> * (C) Copyright 2008, Google Inc.</span>
 
111
<a name="l00009"></a>00009 <span class="comment"> ** Licensed under the Apache License, Version 2.0 (the &quot;License&quot;);</span>
 
112
<a name="l00010"></a>00010 <span class="comment"> ** you may not use this file except in compliance with the License.</span>
 
113
<a name="l00011"></a>00011 <span class="comment"> ** You may obtain a copy of the License at</span>
 
114
<a name="l00012"></a>00012 <span class="comment"> ** http://www.apache.org/licenses/LICENSE-2.0</span>
 
115
<a name="l00013"></a>00013 <span class="comment"> ** Unless required by applicable law or agreed to in writing, software</span>
 
116
<a name="l00014"></a>00014 <span class="comment"> ** distributed under the License is distributed on an &quot;AS IS&quot; BASIS,</span>
 
117
<a name="l00015"></a>00015 <span class="comment"> ** WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.</span>
 
118
<a name="l00016"></a>00016 <span class="comment"> ** See the License for the specific language governing permissions and</span>
 
119
<a name="l00017"></a>00017 <span class="comment"> ** limitations under the License.</span>
 
120
<a name="l00018"></a>00018 <span class="comment"> *</span>
 
121
<a name="l00019"></a>00019 <span class="comment"> **********************************************************************/</span>
 
122
<a name="l00020"></a>00020 
 
123
<a name="l00021"></a>00021 <span class="preprocessor">#ifdef HAVE_CONFIG_H</span>
 
124
<a name="l00022"></a>00022 <span class="preprocessor"></span><span class="preprocessor">#include &quot;<a class="code" href="a00950.html">config_auto.h</a>&quot;</span>
 
125
<a name="l00023"></a>00023 <span class="preprocessor">#endif</span>
 
126
<a name="l00024"></a>00024 <span class="preprocessor"></span>
 
127
<a name="l00025"></a>00025 <span class="preprocessor">#include &quot;<a class="code" href="a01107.html">devanagari_processing.h</a>&quot;</span>
 
128
<a name="l00026"></a>00026 <span class="preprocessor">#include &quot;allheaders.h&quot;</span>
 
129
<a name="l00027"></a>00027 <span class="preprocessor">#include &quot;<a class="code" href="a01155.html">tordmain.h</a>&quot;</span>
 
130
<a name="l00028"></a>00028 <span class="preprocessor">#include &quot;<a class="code" href="a00798.html">statistc.h</a>&quot;</span>
 
131
<a name="l00029"></a>00029 
 
132
<a name="l00030"></a>00030 <span class="comment">// Flags controlling the debugging information for shiro-rekha splitting</span>
 
133
<a name="l00031"></a>00031 <span class="comment">// strategies.</span>
 
134
<a name="l00032"></a>00032 <a class="code" href="a00844.html#a554d43d0cf0e3f9552921941d9e147bd">INT_VAR</a>(<a class="code" href="a01106.html#ad6b4d3ded1df0799766c874662d63050">devanagari_split_debuglevel</a>, 0,
 
135
<a name="l00033"></a><a class="code" href="a01107.html#ad6b4d3ded1df0799766c874662d63050">00033</a>         <span class="stringliteral">&quot;Debug level for split shiro-rekha process.&quot;</span>);
 
136
<a name="l00034"></a>00034 
 
137
<a name="l00035"></a>00035 <a class="code" href="a00844.html#a442e7f541a050acf5ebda026db177877">BOOL_VAR</a>(<a class="code" href="a01106.html#a9687e850f464694be20c21d93e891801">devanagari_split_debugimage</a>, 0,
 
138
<a name="l00036"></a><a class="code" href="a01107.html#a9687e850f464694be20c21d93e891801">00036</a>          <span class="stringliteral">&quot;Whether to create a debug image for split shiro-rekha process.&quot;</span>);
 
139
<a name="l00037"></a>00037 
 
140
<a name="l00038"></a>00038 <span class="keyword">namespace </span><a class="code" href="a01266.html#afed58feacb84df2de88bdd613cfdba6d">tesseract</a> {
 
141
<a name="l00039"></a>00039 
 
142
<a name="l00040"></a><a class="code" href="a00545.html#a09814382ca566884157cceab9076fff2">00040</a> <a class="code" href="a00545.html#a09814382ca566884157cceab9076fff2">ShiroRekhaSplitter::ShiroRekhaSplitter</a>() {
 
143
<a name="l00041"></a>00041   orig_pix_ = NULL;
 
144
<a name="l00042"></a>00042   segmentation_block_list_ = NULL;
 
145
<a name="l00043"></a>00043   splitted_image_ = NULL;
 
146
<a name="l00044"></a>00044   global_xheight_ = <a class="code" href="a00545.html#ac973904ee08ed3d33aa15afc9dc2a903">kUnspecifiedXheight</a>;
 
147
<a name="l00045"></a>00045   perform_close_ = <span class="keyword">false</span>;
 
148
<a name="l00046"></a>00046   debug_image_ = NULL;
 
149
<a name="l00047"></a>00047   pageseg_split_strategy_ = <a class="code" href="a00545.html#ab44f3b6e26668478841a5b8c45332601a1ca815839c8e78def404b329ba79697a">NO_SPLIT</a>;
 
150
<a name="l00048"></a>00048   ocr_split_strategy_ = <a class="code" href="a00545.html#ab44f3b6e26668478841a5b8c45332601a1ca815839c8e78def404b329ba79697a">NO_SPLIT</a>;
 
151
<a name="l00049"></a>00049 }
 
152
<a name="l00050"></a>00050 
 
153
<a name="l00051"></a><a class="code" href="a00545.html#a018fa239787df6051031ac4627e442cb">00051</a> <a class="code" href="a00545.html#a018fa239787df6051031ac4627e442cb">ShiroRekhaSplitter::~ShiroRekhaSplitter</a>() {
 
154
<a name="l00052"></a>00052   <a class="code" href="a00545.html#a8bfcc88be2d166b396f760d10ae29f18">Clear</a>();
 
155
<a name="l00053"></a>00053 }
 
156
<a name="l00054"></a>00054 
 
157
<a name="l00055"></a><a class="code" href="a00545.html#a8bfcc88be2d166b396f760d10ae29f18">00055</a> <span class="keywordtype">void</span> <a class="code" href="a00545.html#a8bfcc88be2d166b396f760d10ae29f18">ShiroRekhaSplitter::Clear</a>() {
 
158
<a name="l00056"></a>00056   pixDestroy(&amp;orig_pix_);
 
159
<a name="l00057"></a>00057   pixDestroy(&amp;splitted_image_);
 
160
<a name="l00058"></a>00058   pageseg_split_strategy_ = <a class="code" href="a00545.html#ab44f3b6e26668478841a5b8c45332601a1ca815839c8e78def404b329ba79697a">NO_SPLIT</a>;
 
161
<a name="l00059"></a>00059   ocr_split_strategy_ = <a class="code" href="a00545.html#ab44f3b6e26668478841a5b8c45332601a1ca815839c8e78def404b329ba79697a">NO_SPLIT</a>;
 
162
<a name="l00060"></a>00060   pixDestroy(&amp;debug_image_);
 
163
<a name="l00061"></a>00061   segmentation_block_list_ = NULL;
 
164
<a name="l00062"></a>00062   global_xheight_ = <a class="code" href="a00545.html#ac973904ee08ed3d33aa15afc9dc2a903">kUnspecifiedXheight</a>;
 
165
<a name="l00063"></a>00063   perform_close_ = <span class="keyword">false</span>;
 
166
<a name="l00064"></a>00064 }
 
167
<a name="l00065"></a>00065 
 
168
<a name="l00066"></a>00066 <span class="comment">// This method dumps a debug image to the specified location.</span>
 
169
<a name="l00067"></a><a class="code" href="a00545.html#ac60692d8c95f1ed1505adbd2554ece53">00067</a> <span class="keywordtype">void</span> <a class="code" href="a00545.html#ac60692d8c95f1ed1505adbd2554ece53">ShiroRekhaSplitter::DumpDebugImage</a>(<span class="keyword">const</span> <span class="keywordtype">char</span>* <a class="code" href="a01266.html#a61c02c0afc996e6b9c619f0a757af50b">filename</a>)<span class="keyword"> const </span>{
 
170
<a name="l00068"></a>00068   pixWrite(filename, debug_image_, IFF_PNG);
 
171
<a name="l00069"></a>00069 }
 
172
<a name="l00070"></a>00070 
 
173
<a name="l00071"></a>00071 <span class="comment">// On setting the input image, a clone of it is owned by this class.</span>
 
174
<a name="l00072"></a><a class="code" href="a00545.html#aef511d3502b7ea23cde356ef6454f064">00072</a> <span class="keywordtype">void</span> <a class="code" href="a00545.html#aef511d3502b7ea23cde356ef6454f064">ShiroRekhaSplitter::set_orig_pix</a>(Pix* pix) {
 
175
<a name="l00073"></a>00073   <span class="keywordflow">if</span> (orig_pix_) {
 
176
<a name="l00074"></a>00074     pixDestroy(&amp;orig_pix_);
 
177
<a name="l00075"></a>00075   }
 
178
<a name="l00076"></a>00076   orig_pix_ = pixClone(pix);
 
179
<a name="l00077"></a>00077 }
 
180
<a name="l00078"></a>00078 
 
181
<a name="l00079"></a>00079 <span class="comment">// Top-level method to perform splitting based on current settings.</span>
 
182
<a name="l00080"></a>00080 <span class="comment">// Returns true if a split was actually performed.</span>
 
183
<a name="l00081"></a>00081 <span class="comment">// split_for_pageseg should be true if the splitting is being done prior to</span>
 
184
<a name="l00082"></a>00082 <span class="comment">// page segmentation. This mode uses the flag</span>
 
185
<a name="l00083"></a>00083 <span class="comment">// pageseg_devanagari_split_strategy to determine the splitting strategy.</span>
 
186
<a name="l00084"></a><a class="code" href="a00545.html#a28e6f7d06927c5742be73589cb3eefcf">00084</a> <span class="keywordtype">bool</span> <a class="code" href="a00545.html#a28e6f7d06927c5742be73589cb3eefcf">ShiroRekhaSplitter::Split</a>(<span class="keywordtype">bool</span> split_for_pageseg) {
 
187
<a name="l00085"></a>00085   <a class="code" href="a00545.html#ab44f3b6e26668478841a5b8c45332601">SplitStrategy</a> split_strategy = split_for_pageseg ? pageseg_split_strategy_ :
 
188
<a name="l00086"></a>00086       ocr_split_strategy_;
 
189
<a name="l00087"></a>00087   <span class="keywordflow">if</span> (split_strategy == <a class="code" href="a00545.html#ab44f3b6e26668478841a5b8c45332601a1ca815839c8e78def404b329ba79697a">NO_SPLIT</a>) {
 
190
<a name="l00088"></a>00088     <span class="keywordflow">return</span> <span class="keyword">false</span>;  <span class="comment">// Nothing to do.</span>
 
191
<a name="l00089"></a>00089   }
 
192
<a name="l00090"></a>00090   <a class="code" href="a00823.html#a93a603f4063a6b9403d81caa245a583b">ASSERT_HOST</a>(split_strategy == <a class="code" href="a00545.html#ab44f3b6e26668478841a5b8c45332601abb20813b04f412bb19593e228c343503">MINIMAL_SPLIT</a> ||
 
193
<a name="l00091"></a>00091               split_strategy == <a class="code" href="a00545.html#ab44f3b6e26668478841a5b8c45332601a8835ad2cdb469808d2aa1d4c8546426c">MAXIMAL_SPLIT</a>);
 
194
<a name="l00092"></a>00092   <a class="code" href="a00823.html#a93a603f4063a6b9403d81caa245a583b">ASSERT_HOST</a>(orig_pix_);
 
195
<a name="l00093"></a>00093   <span class="keywordflow">if</span> (<a class="code" href="a01106.html#ad6b4d3ded1df0799766c874662d63050">devanagari_split_debuglevel</a> &gt; 0) {
 
196
<a name="l00094"></a>00094     <a class="code" href="a00860.html#a02aa7cca2c3857c14716e8cca96ace6c">tprintf</a>(<span class="stringliteral">&quot;Splitting shiro-rekha ...\n&quot;</span>);
 
197
<a name="l00095"></a>00095     <a class="code" href="a00860.html#a02aa7cca2c3857c14716e8cca96ace6c">tprintf</a>(<span class="stringliteral">&quot;Split strategy = %s\n&quot;</span>,
 
198
<a name="l00096"></a>00096             split_strategy == <a class="code" href="a00545.html#ab44f3b6e26668478841a5b8c45332601abb20813b04f412bb19593e228c343503">MINIMAL_SPLIT</a> ? <span class="stringliteral">&quot;Minimal&quot;</span> : <span class="stringliteral">&quot;Maximal&quot;</span>);
 
199
<a name="l00097"></a>00097     <a class="code" href="a00860.html#a02aa7cca2c3857c14716e8cca96ace6c">tprintf</a>(<span class="stringliteral">&quot;Initial pageseg available = %s\n&quot;</span>,
 
200
<a name="l00098"></a>00098             segmentation_block_list_ ? <span class="stringliteral">&quot;yes&quot;</span> : <span class="stringliteral">&quot;no&quot;</span>);
 
201
<a name="l00099"></a>00099   }
 
202
<a name="l00100"></a>00100   <span class="comment">// Create a copy of original image to store the splitting output.</span>
 
203
<a name="l00101"></a>00101   pixDestroy(&amp;splitted_image_);
 
204
<a name="l00102"></a>00102   splitted_image_ = pixCopy(NULL, orig_pix_);
 
205
<a name="l00103"></a>00103 
 
206
<a name="l00104"></a>00104   <span class="comment">// Initialize debug image if required.</span>
 
207
<a name="l00105"></a>00105   <span class="keywordflow">if</span> (<a class="code" href="a01106.html#a9687e850f464694be20c21d93e891801">devanagari_split_debugimage</a>) {
 
208
<a name="l00106"></a>00106     pixDestroy(&amp;debug_image_);
 
209
<a name="l00107"></a>00107     debug_image_ = pixConvertTo32(orig_pix_);
 
210
<a name="l00108"></a>00108   }
 
211
<a name="l00109"></a>00109 
 
212
<a name="l00110"></a>00110   <span class="comment">// Determine all connected components in the input image. A close operation</span>
 
213
<a name="l00111"></a>00111   <span class="comment">// may be required prior to this, depending on the current settings.</span>
 
214
<a name="l00112"></a>00112   Pix* pix_for_ccs = pixClone(orig_pix_);
 
215
<a name="l00113"></a>00113   <span class="keywordflow">if</span> (perform_close_ &amp;&amp; global_xheight_ != <a class="code" href="a00545.html#ac973904ee08ed3d33aa15afc9dc2a903">kUnspecifiedXheight</a> &amp;&amp;
 
216
<a name="l00114"></a>00114       !segmentation_block_list_) {
 
217
<a name="l00115"></a>00115     <span class="keywordflow">if</span> (<a class="code" href="a01106.html#ad6b4d3ded1df0799766c874662d63050">devanagari_split_debuglevel</a> &gt; 0) {
 
218
<a name="l00116"></a>00116       <a class="code" href="a00860.html#a02aa7cca2c3857c14716e8cca96ace6c">tprintf</a>(<span class="stringliteral">&quot;Performing a global close operation..\n&quot;</span>);
 
219
<a name="l00117"></a>00117     }
 
220
<a name="l00118"></a>00118     <span class="comment">// A global measure is available for xheight, but no local information</span>
 
221
<a name="l00119"></a>00119     <span class="comment">// exists.</span>
 
222
<a name="l00120"></a>00120     pixDestroy(&amp;pix_for_ccs);
 
223
<a name="l00121"></a>00121     pix_for_ccs = pixCopy(NULL, orig_pix_);
 
224
<a name="l00122"></a>00122     PerformClose(pix_for_ccs, global_xheight_);
 
225
<a name="l00123"></a>00123   }
 
226
<a name="l00124"></a>00124   Pixa* ccs;
 
227
<a name="l00125"></a>00125   Boxa* tmp_boxa = pixConnComp(pix_for_ccs, &amp;ccs, 8);
 
228
<a name="l00126"></a>00126   boxaDestroy(&amp;tmp_boxa);
 
229
<a name="l00127"></a>00127   pixDestroy(&amp;pix_for_ccs);
 
230
<a name="l00128"></a>00128 
 
231
<a name="l00129"></a>00129   <span class="comment">// Iterate over all connected components. Get their bounding boxes and clip</span>
 
232
<a name="l00130"></a>00130   <span class="comment">// out the image regions corresponding to these boxes from the original image.</span>
 
233
<a name="l00131"></a>00131   <span class="comment">// Conditionally run splitting on each of them.</span>
 
234
<a name="l00132"></a>00132   Boxa* regions_to_clear = boxaCreate(0);
 
235
<a name="l00133"></a>00133   <span class="keywordflow">for</span> (<span class="keywordtype">int</span> i = 0; i &lt; pixaGetCount(ccs); ++i) {
 
236
<a name="l00134"></a>00134     Box* box = ccs-&gt;boxa-&gt;box[i];
 
237
<a name="l00135"></a>00135     Pix* word_pix = pixClipRectangle(orig_pix_, box, NULL);
 
238
<a name="l00136"></a>00136     <a class="code" href="a00823.html#a93a603f4063a6b9403d81caa245a583b">ASSERT_HOST</a>(word_pix);
 
239
<a name="l00137"></a>00137     <span class="keywordtype">int</span> xheight = GetXheightForCC(box);
 
240
<a name="l00138"></a>00138     <span class="keywordflow">if</span> (xheight == <a class="code" href="a00545.html#ac973904ee08ed3d33aa15afc9dc2a903">kUnspecifiedXheight</a> &amp;&amp; segmentation_block_list_ &amp;&amp;
 
241
<a name="l00139"></a>00139         <a class="code" href="a01106.html#a9687e850f464694be20c21d93e891801">devanagari_split_debugimage</a>) {
 
242
<a name="l00140"></a>00140       pixRenderBoxArb(debug_image_, box, 1, 255, 0, 0);
 
243
<a name="l00141"></a>00141     }
 
244
<a name="l00142"></a>00142     <span class="comment">// If some xheight measure is available, attempt to pre-eliminate small</span>
 
245
<a name="l00143"></a>00143     <span class="comment">// blobs from the shiro-rekha process. This is primarily to save the CCs</span>
 
246
<a name="l00144"></a>00144     <span class="comment">// corresponding to punctuation marks/small dots etc which are part of</span>
 
247
<a name="l00145"></a>00145     <span class="comment">// larger graphemes.</span>
 
248
<a name="l00146"></a>00146     <span class="keywordflow">if</span> (xheight == <a class="code" href="a00545.html#ac973904ee08ed3d33aa15afc9dc2a903">kUnspecifiedXheight</a> ||
 
249
<a name="l00147"></a>00147         (box-&gt;w &gt; xheight / 3 &amp;&amp; box-&gt;h &gt; xheight / 2)) {
 
250
<a name="l00148"></a>00148       SplitWordShiroRekha(split_strategy, word_pix, xheight,
 
251
<a name="l00149"></a>00149                           box-&gt;x, box-&gt;y, regions_to_clear);
 
252
<a name="l00150"></a>00150     } <span class="keywordflow">else</span> <span class="keywordflow">if</span> (<a class="code" href="a01106.html#ad6b4d3ded1df0799766c874662d63050">devanagari_split_debuglevel</a> &gt; 0) {
 
253
<a name="l00151"></a>00151       <a class="code" href="a00860.html#a02aa7cca2c3857c14716e8cca96ace6c">tprintf</a>(<span class="stringliteral">&quot;CC dropped from splitting: %d,%d (%d, %d)\n&quot;</span>,
 
254
<a name="l00152"></a>00152               box-&gt;x, box-&gt;y, box-&gt;w, box-&gt;h);
 
255
<a name="l00153"></a>00153     }
 
256
<a name="l00154"></a>00154     pixDestroy(&amp;word_pix);
 
257
<a name="l00155"></a>00155   }
 
258
<a name="l00156"></a>00156   <span class="comment">// Actually clear the boxes now.</span>
 
259
<a name="l00157"></a>00157   <span class="keywordflow">for</span> (<span class="keywordtype">int</span> i = 0; i &lt; boxaGetCount(regions_to_clear); ++i) {
 
260
<a name="l00158"></a>00158     Box* box = boxaGetBox(regions_to_clear, i, L_CLONE);
 
261
<a name="l00159"></a>00159     pixClearInRect(splitted_image_, box);
 
262
<a name="l00160"></a>00160     boxDestroy(&amp;box);
 
263
<a name="l00161"></a>00161   }
 
264
<a name="l00162"></a>00162   boxaDestroy(&amp;regions_to_clear);
 
265
<a name="l00163"></a>00163   pixaDestroy(&amp;ccs);
 
266
<a name="l00164"></a>00164   <span class="keywordflow">if</span> (<a class="code" href="a01106.html#a9687e850f464694be20c21d93e891801">devanagari_split_debugimage</a>) {
 
267
<a name="l00165"></a>00165     <a class="code" href="a00545.html#ac60692d8c95f1ed1505adbd2554ece53">DumpDebugImage</a>(split_for_pageseg ? <span class="stringliteral">&quot;pageseg_split_debug.png&quot;</span> :
 
268
<a name="l00166"></a>00166                    <span class="stringliteral">&quot;ocr_split_debug.png&quot;</span>);
 
269
<a name="l00167"></a>00167   }
 
270
<a name="l00168"></a>00168   <span class="keywordflow">return</span> <span class="keyword">true</span>;
 
271
<a name="l00169"></a>00169 }
 
272
<a name="l00170"></a>00170 
 
273
<a name="l00171"></a>00171 <span class="comment">// Method to perform a close operation on the input image. The xheight</span>
 
274
<a name="l00172"></a>00172 <span class="comment">// estimate decides the size of sel used.</span>
 
275
<a name="l00173"></a>00173 <span class="keywordtype">void</span> ShiroRekhaSplitter::PerformClose(Pix* pix, <span class="keywordtype">int</span> xheight_estimate) {
 
276
<a name="l00174"></a>00174   pixCloseBrick(pix, pix, xheight_estimate / 8, xheight_estimate / 3);
 
277
<a name="l00175"></a>00175 }
 
278
<a name="l00176"></a>00176 
 
279
<a name="l00177"></a>00177 <span class="comment">// This method resolves the cc bbox to a particular row and returns the row&#39;s</span>
 
280
<a name="l00178"></a>00178 <span class="comment">// xheight.</span>
 
281
<a name="l00179"></a>00179 <span class="keywordtype">int</span> ShiroRekhaSplitter::GetXheightForCC(Box* cc_bbox) {
 
282
<a name="l00180"></a>00180   <span class="keywordflow">if</span> (!segmentation_block_list_) {
 
283
<a name="l00181"></a>00181     <span class="keywordflow">return</span> global_xheight_;
 
284
<a name="l00182"></a>00182   }
 
285
<a name="l00183"></a>00183   <span class="comment">// Compute the box coordinates in Tesseract&#39;s coordinate system.</span>
 
286
<a name="l00184"></a>00184   <a class="code" href="a00592.html">TBOX</a> bbox(cc_bbox-&gt;x,
 
287
<a name="l00185"></a>00185             pixGetHeight(orig_pix_) - cc_bbox-&gt;y - cc_bbox-&gt;h - 1,
 
288
<a name="l00186"></a>00186             cc_bbox-&gt;x + cc_bbox-&gt;w,
 
289
<a name="l00187"></a>00187             pixGetHeight(orig_pix_) - cc_bbox-&gt;y - 1);
 
290
<a name="l00188"></a>00188   <span class="comment">// Iterate over all blocks.</span>
 
291
<a name="l00189"></a>00189   BLOCK_IT block_it(segmentation_block_list_);
 
292
<a name="l00190"></a>00190   <span class="keywordflow">for</span> (block_it.mark_cycle_pt(); !block_it.cycled_list(); block_it.forward()) {
 
293
<a name="l00191"></a>00191     <a class="code" href="a00280.html">BLOCK</a>* block = block_it.data();
 
294
<a name="l00192"></a>00192     <span class="comment">// Iterate over all rows in the block.</span>
 
295
<a name="l00193"></a>00193     ROW_IT row_it(block-&gt;<a class="code" href="a00280.html#ae9826e422b0bf17a7592dee8db3fe058" title="get rows">row_list</a>());
 
296
<a name="l00194"></a>00194     <span class="keywordflow">for</span> (row_it.mark_cycle_pt(); !row_it.cycled_list(); row_it.forward()) {
 
297
<a name="l00195"></a>00195       <a class="code" href="a00521.html">ROW</a>* row = row_it.data();
 
298
<a name="l00196"></a>00196       <span class="keywordflow">if</span> (!row-&gt;<a class="code" href="a00521.html#a7bb838e55056e39e15d7e2cea8ebebb0">bounding_box</a>().<a class="code" href="a00592.html#aeabe87a0ee3912ca63550ffee4fb4115">major_overlap</a>(bbox)) {
 
299
<a name="l00197"></a>00197         <span class="keywordflow">continue</span>;
 
300
<a name="l00198"></a>00198       }
 
301
<a name="l00199"></a>00199       <span class="comment">// Row could be skewed, warped, etc. Use the position of the box to</span>
 
302
<a name="l00200"></a>00200       <span class="comment">// determine the baseline position of the row for that x-coordinate.</span>
 
303
<a name="l00201"></a>00201       <span class="comment">// Create a square TBOX whose baseline&#39;s mid-point lies at this point</span>
 
304
<a name="l00202"></a>00202       <span class="comment">// and whose side is the row&#39;s xheight. Take the overlap of this box with the input</span>
 
305
<a name="l00203"></a>00203       <span class="comment">// box and check if it is a &#39;major overlap&#39;. If so, this box lies in this</span>
 
306
<a name="l00204"></a>00204       <span class="comment">// row. In that case, return the xheight for this row.</span>
 
307
<a name="l00205"></a>00205       <span class="keywordtype">float</span> box_middle = 0.5 * (bbox.left() + bbox.right());
 
308
<a name="l00206"></a>00206       <span class="keywordtype">int</span> <a class="code" href="a00921.html#a2a4b69f9a2827dc98bc4cbc233118865a83297de004f4e58b9be2108c6cd08a23">baseline</a> = <span class="keyword">static_cast&lt;</span><span class="keywordtype">int</span><span class="keyword">&gt;</span>(row-&gt;<a class="code" href="a00521.html#a097b3543fa3ca5768eb50033d4c4db9c">base_line</a>(box_middle) + 0.5);
 
309
<a name="l00207"></a>00207       <a class="code" href="a00592.html">TBOX</a> test_box(box_middle - row-&gt;<a class="code" href="a00521.html#a2954f94ec4eefe1e3729912e5b8ea779">x_height</a>() / 2,
 
310
<a name="l00208"></a>00208                     <a class="code" href="a00921.html#a2a4b69f9a2827dc98bc4cbc233118865a83297de004f4e58b9be2108c6cd08a23">baseline</a>,
 
311
<a name="l00209"></a>00209                     box_middle + row-&gt;<a class="code" href="a00521.html#a2954f94ec4eefe1e3729912e5b8ea779">x_height</a>() / 2,
 
312
<a name="l00210"></a>00210                     <span class="keyword">static_cast&lt;</span><span class="keywordtype">int</span><span class="keyword">&gt;</span>(baseline + row-&gt;<a class="code" href="a00521.html#a2954f94ec4eefe1e3729912e5b8ea779">x_height</a>()));
 
313
<a name="l00211"></a>00211       <span class="comment">// Compute overlap. If it is is a major overlap, this is the right row.</span>
 
314
<a name="l00212"></a>00212       <span class="keywordflow">if</span> (bbox.major_overlap(test_box)) {
 
315
<a name="l00213"></a>00213         <span class="keywordflow">return</span> row-&gt;<a class="code" href="a00521.html#a2954f94ec4eefe1e3729912e5b8ea779">x_height</a>();
 
316
<a name="l00214"></a>00214       }
 
317
<a name="l00215"></a>00215     }
 
318
<a name="l00216"></a>00216   }
 
319
<a name="l00217"></a>00217   <span class="comment">// No row found for this bbox.</span>
 
320
<a name="l00218"></a>00218   <span class="keywordflow">return</span> <a class="code" href="a00545.html#ac973904ee08ed3d33aa15afc9dc2a903">kUnspecifiedXheight</a>;
 
321
<a name="l00219"></a>00219 }
 
322
<a name="l00220"></a>00220 
 
323
<a name="l00221"></a>00221 <span class="comment">// Returns a list of regions (boxes) which should be cleared in the original</span>
 
324
<a name="l00222"></a>00222 <span class="comment">// image so as to perform shiro-rekha splitting. Pix is assumed to carry one</span>
 
325
<a name="l00223"></a>00223 <span class="comment">// (or less) word only. Xheight measure could be the global estimate, the row</span>
 
326
<a name="l00224"></a>00224 <span class="comment">// estimate, or unspecified. If unspecified, over-splitting may occur, since a</span>
 
327
<a name="l00225"></a>00225 <span class="comment">// conservative estimate of stroke width along with an associated multiplier</span>
 
328
<a name="l00226"></a>00226 <span class="comment">// is used in its place. It is advisable to have a specified xheight when</span>
 
329
<a name="l00227"></a>00227 <span class="comment">// splitting for classification/training.</span>
 
330
<a name="l00228"></a>00228 <span class="comment">// A vertical projection histogram of all the on-pixels in the input pix is</span>
 
331
<a name="l00229"></a>00229 <span class="comment">// computed. The maximum of this histogram is regarded as an approximate location</span>
 
332
<a name="l00230"></a>00230 <span class="comment">// of the shiro-rekha. By descending from the maximum&#39;s peak on both sides,</span>
 
333
<a name="l00231"></a>00231 <span class="comment">// stroke width of shiro-rekha is estimated.</span>
 
334
<a name="l00232"></a>00232 <span class="comment">// A horizontal projection histogram is computed for a sub-image of the input</span>
 
335
<a name="l00233"></a>00233 <span class="comment">// image, which extends from just below the shiro-rekha down to a certain</span>
 
336
<a name="l00234"></a>00234 <span class="comment">// leeway. The leeway depends on the input xheight, if provided, else a</span>
 
337
<a name="l00235"></a>00235 <span class="comment">// conservative multiplier on approximate stroke width is used (which may lead</span>
 
338
<a name="l00236"></a>00236 <span class="comment">// to over-splitting).</span>
 
339
<a name="l00237"></a>00237 <span class="keywordtype">void</span> ShiroRekhaSplitter::SplitWordShiroRekha(SplitStrategy split_strategy,
 
340
<a name="l00238"></a>00238                                              Pix* pix,
 
341
<a name="l00239"></a>00239                                              <span class="keywordtype">int</span> xheight,
 
342
<a name="l00240"></a>00240                                              <span class="keywordtype">int</span> word_left,
 
343
<a name="l00241"></a>00241                                              <span class="keywordtype">int</span> word_top,
 
344
<a name="l00242"></a>00242                                              Boxa* regions_to_clear) {
 
345
<a name="l00243"></a>00243   <span class="keywordflow">if</span> (split_strategy == <a class="code" href="a00545.html#ab44f3b6e26668478841a5b8c45332601a1ca815839c8e78def404b329ba79697a">NO_SPLIT</a>) {
 
346
<a name="l00244"></a>00244     <span class="keywordflow">return</span>;
 
347
<a name="l00245"></a>00245   }
 
348
<a name="l00246"></a>00246   <span class="keywordtype">int</span> width = pixGetWidth(pix);
 
349
<a name="l00247"></a>00247   <span class="keywordtype">int</span> height = pixGetHeight(pix);
 
350
<a name="l00248"></a>00248   <span class="comment">// Statistically determine the yextents of the shiro-rekha.</span>
 
351
<a name="l00249"></a>00249   <span class="keywordtype">int</span> shirorekha_top, shirorekha_bottom, shirorekha_ylevel;
 
352
<a name="l00250"></a>00250   GetShiroRekhaYExtents(pix, &amp;shirorekha_top, &amp;shirorekha_bottom,
 
353
<a name="l00251"></a>00251                         &amp;shirorekha_ylevel);
 
354
<a name="l00252"></a>00252   <span class="comment">// Since the shiro rekha is also a stroke, its width is equal to the stroke</span>
 
355
<a name="l00253"></a>00253   <span class="comment">// width.</span>
 
356
<a name="l00254"></a>00254   <span class="keywordtype">int</span> stroke_width = shirorekha_bottom - shirorekha_top + 1;
 
357
<a name="l00255"></a>00255 
 
358
<a name="l00256"></a>00256   <span class="comment">// Some safeguards to protect CCs we do not want to be split.</span>
 
359
<a name="l00257"></a>00257   <span class="comment">// These are particularly useful when the word wasn&#39;t eliminated earlier</span>
 
360
<a name="l00258"></a>00258   <span class="comment">// because xheight information was unavailable.</span>
 
361
<a name="l00259"></a>00259   <span class="keywordflow">if</span> (shirorekha_ylevel &gt; height / 2) {
 
362
<a name="l00260"></a>00260     <span class="comment">// Shirorekha shouldn&#39;t be in the bottom half of the word.</span>
 
363
<a name="l00261"></a>00261     <span class="keywordflow">if</span> (<a class="code" href="a01106.html#ad6b4d3ded1df0799766c874662d63050">devanagari_split_debuglevel</a> &gt; 0) {
 
364
<a name="l00262"></a>00262       <a class="code" href="a00860.html#a02aa7cca2c3857c14716e8cca96ace6c">tprintf</a>(<span class="stringliteral">&quot;Skipping splitting CC at (%d, %d): shirorekha in lower half..\n&quot;</span>,
 
365
<a name="l00263"></a>00263               word_left, word_top);
 
366
<a name="l00264"></a>00264     }
 
367
<a name="l00265"></a>00265     <span class="keywordflow">return</span>;
 
368
<a name="l00266"></a>00266   }
 
369
<a name="l00267"></a>00267   <span class="keywordflow">if</span> (stroke_width &gt; height / 3) {
 
370
<a name="l00268"></a>00268     <span class="comment">// Even the boldest of fonts shouldn&#39;t do this.</span>
 
371
<a name="l00269"></a>00269     <span class="keywordflow">if</span> (<a class="code" href="a01106.html#ad6b4d3ded1df0799766c874662d63050">devanagari_split_debuglevel</a> &gt; 0) {
 
372
<a name="l00270"></a>00270       <a class="code" href="a00860.html#a02aa7cca2c3857c14716e8cca96ace6c">tprintf</a>(<span class="stringliteral">&quot;Skipping splitting CC at (%d, %d): stroke width too huge..\n&quot;</span>,
 
373
<a name="l00271"></a>00271               word_left, word_top);
 
374
<a name="l00272"></a>00272     }
 
375
<a name="l00273"></a>00273     <span class="keywordflow">return</span>;
 
376
<a name="l00274"></a>00274   }
 
377
<a name="l00275"></a>00275 
 
378
<a name="l00276"></a>00276   <span class="comment">// Clear the ascender and descender regions of the word.</span>
 
379
<a name="l00277"></a>00277   <span class="comment">// Obtain a vertical projection histogram for the resulting image.</span>
 
380
<a name="l00278"></a>00278   Box* box_to_clear = boxCreate(0, shirorekha_top - stroke_width / 3,
 
381
<a name="l00279"></a>00279                                 width, 5 * stroke_width / 3);
 
382
<a name="l00280"></a>00280   Pix* word_in_xheight = pixCopy(NULL, pix);
 
383
<a name="l00281"></a>00281   pixClearInRect(word_in_xheight, box_to_clear);
 
384
<a name="l00282"></a>00282   <span class="comment">// Also clear any pixels which are below shirorekha_bottom + some leeway.</span>
 
385
<a name="l00283"></a>00283   <span class="comment">// The leeway is set to xheight if the information is available, else it is a</span>
 
386
<a name="l00284"></a>00284   <span class="comment">// multiplier applied to the stroke width.</span>
 
387
<a name="l00285"></a>00285   <span class="keywordtype">int</span> leeway_to_keep = stroke_width * 3;
 
388
<a name="l00286"></a>00286   <span class="keywordflow">if</span> (xheight != <a class="code" href="a00545.html#ac973904ee08ed3d33aa15afc9dc2a903">kUnspecifiedXheight</a>) {
 
389
<a name="l00287"></a>00287     <span class="comment">// This is because the xheight-region typically includes the shiro-rekha</span>
 
390
<a name="l00288"></a>00288     <span class="comment">// inside it, i.e., the top of the xheight range corresponds to the top of</span>
 
391
<a name="l00289"></a>00289     <span class="comment">// shiro-rekha.</span>
 
392
<a name="l00290"></a>00290     leeway_to_keep = xheight - stroke_width;
 
393
<a name="l00291"></a>00291   }
 
394
<a name="l00292"></a>00292   box_to_clear-&gt;y = shirorekha_bottom + leeway_to_keep;
 
395
<a name="l00293"></a>00293   box_to_clear-&gt;h = height - box_to_clear-&gt;y;
 
396
<a name="l00294"></a>00294   pixClearInRect(word_in_xheight, box_to_clear);
 
397
<a name="l00295"></a>00295   boxDestroy(&amp;box_to_clear);
 
398
<a name="l00296"></a>00296 
 
399
<a name="l00297"></a>00297   PixelHistogram vert_hist;
 
400
<a name="l00298"></a>00298   vert_hist.ConstructVerticalCountHist(word_in_xheight);
 
401
<a name="l00299"></a>00299   pixDestroy(&amp;word_in_xheight);
 
402
<a name="l00300"></a>00300 
 
403
<a name="l00301"></a>00301   <span class="comment">// If the number of black pixels in any column of the image is less than a</span>
 
404
<a name="l00302"></a>00302   <span class="comment">// fraction of the stroke width, treat it as noise / a stray mark. Perform</span>
 
405
<a name="l00303"></a>00303   <span class="comment">// these changes inside the vert_hist data itself, as that is used later on as</span>
 
406
<a name="l00304"></a>00304   <span class="comment">// a bit vector for the final split decision at every column.</span>
 
407
<a name="l00305"></a>00305   <span class="keywordflow">for</span> (<span class="keywordtype">int</span> i = 0; i &lt; width; ++i) {
 
408
<a name="l00306"></a>00306     <span class="keywordflow">if</span> (vert_hist.hist()[i] &lt;= stroke_width / 4)
 
409
<a name="l00307"></a>00307       vert_hist.hist()[i] = 0;
 
410
<a name="l00308"></a>00308     <span class="keywordflow">else</span>
 
411
<a name="l00309"></a>00309       vert_hist.hist()[i] = 1;
 
412
<a name="l00310"></a>00310   }
 
413
<a name="l00311"></a>00311   <span class="comment">// In order to split the line at any point, we make sure that the width of the</span>
 
414
<a name="l00312"></a>00312   <span class="comment">// gap is at least half the stroke width.</span>
 
415
<a name="l00313"></a>00313   <span class="keywordtype">int</span> i = 0;
 
416
<a name="l00314"></a>00314   <span class="keywordtype">int</span> cur_component_width = 0;
 
417
<a name="l00315"></a>00315   <span class="keywordflow">while</span> (i &lt; width) {
 
418
<a name="l00316"></a>00316     <span class="keywordflow">if</span> (!vert_hist.hist()[i]) {
 
419
<a name="l00317"></a>00317       <span class="keywordtype">int</span> j = 0;
 
420
<a name="l00318"></a>00318       <span class="keywordflow">while</span> (i + j &lt; width &amp;&amp; !vert_hist.hist()[i+j])
 
421
<a name="l00319"></a>00319         ++j;
 
422
<a name="l00320"></a>00320       <span class="keywordflow">if</span> (j &gt;= stroke_width / 2 &amp;&amp; cur_component_width &gt;= stroke_width / 2) {
 
423
<a name="l00321"></a>00321         <span class="comment">// Perform a shiro-rekha split. The intervening region lies from i to</span>
 
424
<a name="l00322"></a>00322         <span class="comment">// i+j-1.</span>
 
425
<a name="l00323"></a>00323         <span class="comment">// A minimal single-pixel split makes the estimation of intra- and</span>
 
426
<a name="l00324"></a>00324         <span class="comment">// inter-word spacing easier during page layout analysis,</span>
 
427
<a name="l00325"></a>00325         <span class="comment">// whereas a maximal split may be needed for OCR, depending on</span>
 
428
<a name="l00326"></a>00326         <span class="comment">// how the engine was trained.</span>
 
429
<a name="l00327"></a>00327         <span class="keywordtype">bool</span> minimal_split = (split_strategy == <a class="code" href="a00545.html#ab44f3b6e26668478841a5b8c45332601abb20813b04f412bb19593e228c343503">MINIMAL_SPLIT</a>);
 
430
<a name="l00328"></a>00328         <span class="keywordtype">int</span> split_width = minimal_split ? 1 : j;
 
431
<a name="l00329"></a>00329         <span class="keywordtype">int</span> split_left = minimal_split ? i + (j / 2) - (split_width / 2) : i;
 
432
<a name="l00330"></a>00330         <span class="keywordflow">if</span> (!minimal_split || (i != 0 &amp;&amp; i + j != width)) {
 
433
<a name="l00331"></a>00331           Box* box_to_clear =
 
434
<a name="l00332"></a>00332               boxCreate(word_left + split_left,
 
435
<a name="l00333"></a>00333                         word_top + shirorekha_top - stroke_width / 3,
 
436
<a name="l00334"></a>00334                         split_width,
 
437
<a name="l00335"></a>00335                         5 * stroke_width / 3);
 
438
<a name="l00336"></a>00336           <span class="keywordflow">if</span> (box_to_clear) {
 
439
<a name="l00337"></a>00337             boxaAddBox(regions_to_clear, box_to_clear, L_CLONE);
 
440
<a name="l00338"></a>00338             <span class="comment">// Mark this in the debug image if needed.</span>
 
441
<a name="l00339"></a>00339             <span class="keywordflow">if</span> (<a class="code" href="a01106.html#a9687e850f464694be20c21d93e891801">devanagari_split_debugimage</a>) {
 
442
<a name="l00340"></a>00340               pixRenderBoxArb(debug_image_, box_to_clear, 1, 128, 255, 128);
 
443
<a name="l00341"></a>00341             }
 
444
<a name="l00342"></a>00342             boxDestroy(&amp;box_to_clear);
 
445
<a name="l00343"></a>00343             cur_component_width = 0;
 
446
<a name="l00344"></a>00344           }
 
447
<a name="l00345"></a>00345         }
 
448
<a name="l00346"></a>00346       }
 
449
<a name="l00347"></a>00347       i += j;
 
450
<a name="l00348"></a>00348     } <span class="keywordflow">else</span> {
 
451
<a name="l00349"></a>00349       ++i;
 
452
<a name="l00350"></a>00350       ++cur_component_width;
 
453
<a name="l00351"></a>00351     }
 
454
<a name="l00352"></a>00352   }
 
455
<a name="l00353"></a>00353 }
 
456
<a name="l00354"></a>00354 
 
457
<a name="l00355"></a>00355 <span class="comment">// Refreshes the words in the segmentation block list by using blobs in the</span>
 
458
<a name="l00356"></a>00356 <span class="comment">// input block list.</span>
 
459
<a name="l00357"></a>00357 <span class="comment">// The segmentation block list must be set.</span>
 
460
<a name="l00358"></a><a class="code" href="a00545.html#a90146104b2c9a136fdd873036cb95230">00358</a> <span class="keywordtype">void</span> <a class="code" href="a00545.html#a90146104b2c9a136fdd873036cb95230">ShiroRekhaSplitter::RefreshSegmentationWithNewBlobs</a>(
 
461
<a name="l00359"></a>00359     C_BLOB_LIST* new_blobs) {
 
462
<a name="l00360"></a>00360   <span class="comment">// The segmentation block list must have been specified.</span>
 
463
<a name="l00361"></a>00361   <a class="code" href="a00823.html#a93a603f4063a6b9403d81caa245a583b">ASSERT_HOST</a>(segmentation_block_list_);
 
464
<a name="l00362"></a>00362   <span class="keywordflow">if</span> (<a class="code" href="a01106.html#ad6b4d3ded1df0799766c874662d63050">devanagari_split_debuglevel</a> &gt; 0) {
 
465
<a name="l00363"></a>00363     <a class="code" href="a00860.html#a02aa7cca2c3857c14716e8cca96ace6c">tprintf</a>(<span class="stringliteral">&quot;Before refreshing blobs:\n&quot;</span>);
 
466
<a name="l00364"></a>00364     <a class="code" href="a00760.html#a7f48b20c8959347726c816b94b3c47f5">PrintSegmentationStats</a>(segmentation_block_list_);
 
467
<a name="l00365"></a>00365     <a class="code" href="a00860.html#a02aa7cca2c3857c14716e8cca96ace6c">tprintf</a>(<span class="stringliteral">&quot;New Blobs found: %d\n&quot;</span>, new_blobs-&gt;length());
 
468
<a name="l00366"></a>00366   }
 
469
<a name="l00367"></a>00367 
 
470
<a name="l00368"></a>00368   C_BLOB_LIST not_found_blobs;
 
471
<a name="l00369"></a>00369   <a class="code" href="a00760.html#af0a18fdb19dd9d4ebe9e73b864c2fad5">RefreshWordBlobsFromNewBlobs</a>(segmentation_block_list_,
 
472
<a name="l00370"></a>00370                                new_blobs,
 
473
<a name="l00371"></a>00371                                ((<a class="code" href="a01106.html#a9687e850f464694be20c21d93e891801">devanagari_split_debugimage</a> &amp;&amp; debug_image_) ?
 
474
<a name="l00372"></a>00372                                 &amp;not_found_blobs : NULL));
 
475
<a name="l00373"></a>00373 
 
476
<a name="l00374"></a>00374   <span class="keywordflow">if</span> (<a class="code" href="a01106.html#ad6b4d3ded1df0799766c874662d63050">devanagari_split_debuglevel</a> &gt; 0) {
 
477
<a name="l00375"></a>00375     <a class="code" href="a00860.html#a02aa7cca2c3857c14716e8cca96ace6c">tprintf</a>(<span class="stringliteral">&quot;After refreshing blobs:\n&quot;</span>);
 
478
<a name="l00376"></a>00376     <a class="code" href="a00760.html#a7f48b20c8959347726c816b94b3c47f5">PrintSegmentationStats</a>(segmentation_block_list_);
 
479
<a name="l00377"></a>00377   }
 
480
<a name="l00378"></a>00378   <span class="keywordflow">if</span> (<a class="code" href="a01106.html#a9687e850f464694be20c21d93e891801">devanagari_split_debugimage</a> &amp;&amp; debug_image_) {
 
481
<a name="l00379"></a>00379     <span class="comment">// Plot out the original blobs for which no match was found in the new</span>
 
482
<a name="l00380"></a>00380     <span class="comment">// all_blobs list.</span>
 
483
<a name="l00381"></a>00381     C_BLOB_IT not_found_it(&amp;not_found_blobs);
 
484
<a name="l00382"></a>00382     <span class="keywordflow">for</span> (not_found_it.mark_cycle_pt(); !not_found_it.cycled_list();
 
485
<a name="l00383"></a>00383          not_found_it.forward()) {
 
486
<a name="l00384"></a>00384       <a class="code" href="a00289.html">C_BLOB</a>* not_found = not_found_it.data();
 
487
<a name="l00385"></a>00385       <a class="code" href="a00592.html">TBOX</a> not_found_box = not_found-&gt;<a class="code" href="a00289.html#a77e52e29e2c622a3a63bb7edb110f6ab">bounding_box</a>();
 
488
<a name="l00386"></a>00386       Box* box_to_plot = GetBoxForTBOX(not_found_box);
 
489
<a name="l00387"></a>00387       pixRenderBoxArb(debug_image_, box_to_plot, 1, 255, 0, 255);
 
490
<a name="l00388"></a>00388       boxDestroy(&amp;box_to_plot);
 
491
<a name="l00389"></a>00389     }
 
492
<a name="l00390"></a>00390 
 
493
<a name="l00391"></a>00391     <span class="comment">// Plot out the blobs unused from all blobs.</span>
 
494
<a name="l00392"></a>00392     C_BLOB_IT all_blobs_it(new_blobs);
 
495
<a name="l00393"></a>00393     <span class="keywordflow">for</span> (all_blobs_it.mark_cycle_pt(); !all_blobs_it.cycled_list();
 
496
<a name="l00394"></a>00394          all_blobs_it.forward()) {
 
497
<a name="l00395"></a>00395       <a class="code" href="a00289.html">C_BLOB</a>* a_blob = all_blobs_it.data();
 
498
<a name="l00396"></a>00396       Box* box_to_plot = GetBoxForTBOX(a_blob-&gt;<a class="code" href="a00289.html#a77e52e29e2c622a3a63bb7edb110f6ab">bounding_box</a>());
 
499
<a name="l00397"></a>00397       pixRenderBoxArb(debug_image_, box_to_plot, 3, 0, 127, 0);
 
500
<a name="l00398"></a>00398       boxDestroy(&amp;box_to_plot);
 
501
<a name="l00399"></a>00399     }
 
502
<a name="l00400"></a>00400   }
 
503
<a name="l00401"></a>00401 }
 
504
<a name="l00402"></a>00402 
 
505
<a name="l00403"></a>00403 <span class="comment">// Returns a new box object for the corresponding TBOX, based on the original</span>
 
506
<a name="l00404"></a>00404 <span class="comment">// image&#39;s coordinate system.</span>
 
507
<a name="l00405"></a>00405 Box* ShiroRekhaSplitter::GetBoxForTBOX(<span class="keyword">const</span> <a class="code" href="a00592.html">TBOX</a>&amp; tbox)<span class="keyword"> const </span>{
 
508
<a name="l00406"></a>00406   <span class="keywordflow">return</span> boxCreate(tbox.<a class="code" href="a00592.html#a724fabf566586b663577dfa944ffbc61">left</a>(), pixGetHeight(orig_pix_) - tbox.<a class="code" href="a00592.html#adf92e9fdac1bdf11c10d1c4d1178791a">top</a>() - 1,
 
509
<a name="l00407"></a>00407                    tbox.<a class="code" href="a00592.html#af95494a2ccacc70cc2b83820b2948619">width</a>(), tbox.<a class="code" href="a00592.html#a8379d4bbc72bdbb1f069fc14790e632d">height</a>());
 
510
<a name="l00408"></a>00408 }
 
511
<a name="l00409"></a>00409 
 
512
<a name="l00410"></a>00410 <span class="comment">// This method returns the computed mode-height of blobs in the pix.</span>
 
513
<a name="l00411"></a>00411 <span class="comment">// It also prunes very small blobs from calculation.</span>
 
514
<a name="l00412"></a><a class="code" href="a00545.html#a99f3f8f96a8b7bfe08ce2b19c8052a6c">00412</a> <span class="keywordtype">int</span> <a class="code" href="a00545.html#a99f3f8f96a8b7bfe08ce2b19c8052a6c">ShiroRekhaSplitter::GetModeHeight</a>(Pix* pix) {
 
515
<a name="l00413"></a>00413   Boxa* boxa = pixConnComp(pix, NULL, 8);
 
516
<a name="l00414"></a>00414   <a class="code" href="a00556.html">STATS</a> heights(0, pixGetHeight(pix));
 
517
<a name="l00415"></a>00415   heights.<a class="code" href="a00556.html#a28e9fd9515ea3b35e3f66ed078e285a6">clear</a>();
 
518
<a name="l00416"></a>00416   <span class="keywordflow">for</span> (<span class="keywordtype">int</span> i = 0; i &lt; boxaGetCount(boxa); ++i) {
 
519
<a name="l00417"></a>00417     Box* box = boxaGetBox(boxa, i, L_CLONE);
 
520
<a name="l00418"></a>00418     <span class="keywordflow">if</span> (box-&gt;h &gt;= 3 || box-&gt;w &gt;= 3) {
 
521
<a name="l00419"></a>00419       heights.<a class="code" href="a00556.html#ab8cacba14df28eed1bffc4cea0b2f87f">add</a>(box-&gt;h, 1);
 
522
<a name="l00420"></a>00420     }
 
523
<a name="l00421"></a>00421     boxDestroy(&amp;box);
 
524
<a name="l00422"></a>00422   }
 
525
<a name="l00423"></a>00423   boxaDestroy(&amp;boxa);
 
526
<a name="l00424"></a>00424   <span class="keywordflow">return</span> heights.<a class="code" href="a00556.html#a5d353e951f61daf06c6582dfc106ff11">mode</a>();
 
527
<a name="l00425"></a>00425 }
 
528
<a name="l00426"></a>00426 
 
529
<a name="l00427"></a>00427 <span class="comment">// This method returns y-extents of the shiro-rekha computed from the input</span>
 
530
<a name="l00428"></a>00428 <span class="comment">// word image.</span>
 
531
<a name="l00429"></a>00429 <span class="keywordtype">void</span> ShiroRekhaSplitter::GetShiroRekhaYExtents(Pix* word_pix,
 
532
<a name="l00430"></a>00430                                                <span class="keywordtype">int</span>* shirorekha_top,
 
533
<a name="l00431"></a>00431                                                <span class="keywordtype">int</span>* shirorekha_bottom,
 
534
<a name="l00432"></a>00432                                                <span class="keywordtype">int</span>* shirorekha_ylevel) {
 
535
<a name="l00433"></a>00433   <span class="comment">// Compute a histogram from projecting the word on a vertical line.</span>
 
536
<a name="l00434"></a>00434   <a class="code" href="a00503.html">PixelHistogram</a> hist_horiz;
 
537
<a name="l00435"></a>00435   hist_horiz.<a class="code" href="a00503.html#a7d423f56f2e8440301f8af11a952fade">ConstructHorizontalCountHist</a>(word_pix);
 
538
<a name="l00436"></a>00436   <span class="comment">// Get the ylevel where the top-line exists. This is basically the global</span>
 
539
<a name="l00437"></a>00437   <span class="comment">// maximum in the horizontal histogram.</span>
 
540
<a name="l00438"></a>00438   <span class="keywordtype">int</span> topline_onpixel_count = 0;
 
541
<a name="l00439"></a>00439   <span class="keywordtype">int</span> topline_ylevel = hist_horiz.<a class="code" href="a00503.html#ac984a3128e256cdc178cc33da1d81238">GetHistogramMaximum</a>(&amp;topline_onpixel_count);
 
542
<a name="l00440"></a>00440 
 
543
<a name="l00441"></a>00441   <span class="comment">// Get the upper and lower extents of the shiro rekha.</span>
 
544
<a name="l00442"></a>00442   <span class="keywordtype">int</span> thresh = (topline_onpixel_count * 70) / 100;
 
545
<a name="l00443"></a>00443   <span class="keywordtype">int</span> ulimit = topline_ylevel;
 
546
<a name="l00444"></a>00444   <span class="keywordtype">int</span> llimit = topline_ylevel;
 
547
<a name="l00445"></a>00445   <span class="keywordflow">while</span> (ulimit &gt; 0 &amp;&amp; hist_horiz.<a class="code" href="a00503.html#abd202025de01aaf80fa2a852d0fcb38d">hist</a>()[ulimit] &gt;= thresh)
 
548
<a name="l00446"></a>00446     --ulimit;
 
549
<a name="l00447"></a>00447   <span class="keywordflow">while</span> (llimit &lt; pixGetHeight(word_pix) &amp;&amp; hist_horiz.<a class="code" href="a00503.html#abd202025de01aaf80fa2a852d0fcb38d">hist</a>()[llimit] &gt;= thresh)
 
550
<a name="l00448"></a>00448     ++llimit;
 
551
<a name="l00449"></a>00449 
 
552
<a name="l00450"></a>00450   <span class="keywordflow">if</span> (shirorekha_top) *shirorekha_top = ulimit;
 
553
<a name="l00451"></a>00451   <span class="keywordflow">if</span> (shirorekha_bottom) *shirorekha_bottom = llimit;
 
554
<a name="l00452"></a>00452   <span class="keywordflow">if</span> (shirorekha_ylevel) *shirorekha_ylevel = topline_ylevel;
 
555
<a name="l00453"></a>00453 }
 
556
<a name="l00454"></a>00454 
 
557
<a name="l00455"></a>00455 <span class="comment">// This method returns the index of the global maximum of the histogram. The frequency of</span>
 
558
<a name="l00456"></a>00456 <span class="comment">// the global maximum is returned in count, if specified.</span>
 
559
<a name="l00457"></a><a class="code" href="a00503.html#ac984a3128e256cdc178cc33da1d81238">00457</a> <span class="keywordtype">int</span> <a class="code" href="a00503.html#ac984a3128e256cdc178cc33da1d81238">PixelHistogram::GetHistogramMaximum</a>(<span class="keywordtype">int</span>* <a class="code" href="a01042.html#acd4ea858d7133e40518e0832ff9d94b2">count</a>)<span class="keyword"> const </span>{
 
560
<a name="l00458"></a>00458   <span class="keywordtype">int</span> best_value = 0;
 
561
<a name="l00459"></a>00459   <span class="keywordflow">for</span> (<span class="keywordtype">int</span> i = 0; i &lt; length_; ++i) {
 
562
<a name="l00460"></a>00460     <span class="keywordflow">if</span> (hist_[i] &gt; hist_[best_value]) {
 
563
<a name="l00461"></a>00461       best_value = i;
 
564
<a name="l00462"></a>00462     }
 
565
<a name="l00463"></a>00463   }
 
566
<a name="l00464"></a>00464   <span class="keywordflow">if</span> (count) {
 
567
<a name="l00465"></a>00465     *count = hist_[best_value];
 
568
<a name="l00466"></a>00466   }
 
569
<a name="l00467"></a>00467   <span class="keywordflow">return</span> best_value;
 
570
<a name="l00468"></a>00468 }
 
571
<a name="l00469"></a>00469 
 
572
<a name="l00470"></a>00470 <span class="comment">// Methods to construct histograms from images.</span>
 
573
<a name="l00471"></a><a class="code" href="a00503.html#ae6f0d2fd25a0a76b84e370aac7f7b58f">00471</a> <span class="keywordtype">void</span> <a class="code" href="a00503.html#ae6f0d2fd25a0a76b84e370aac7f7b58f">PixelHistogram::ConstructVerticalCountHist</a>(Pix* pix) {
 
574
<a name="l00472"></a>00472   <a class="code" href="a00503.html#aaa214752dc7cbb3923fcece5dff758ed">Clear</a>();
 
575
<a name="l00473"></a>00473   <span class="keywordtype">int</span> width = pixGetWidth(pix);
 
576
<a name="l00474"></a>00474   <span class="keywordtype">int</span> height = pixGetHeight(pix);
 
577
<a name="l00475"></a>00475   hist_ = <span class="keyword">new</span> <span class="keywordtype">int</span>[width];
 
578
<a name="l00476"></a>00476   length_ = width;
 
579
<a name="l00477"></a>00477   <span class="keywordtype">int</span> wpl = pixGetWpl(pix);
 
580
<a name="l00478"></a>00478   l_uint32 *data = pixGetData(pix);
 
581
<a name="l00479"></a>00479   <span class="keywordflow">for</span> (<span class="keywordtype">int</span> i = 0; i &lt; width; ++i)
 
582
<a name="l00480"></a>00480     hist_[i] = 0;
 
583
<a name="l00481"></a>00481   <span class="keywordflow">for</span> (<span class="keywordtype">int</span> i = 0; i &lt; height; ++i) {
 
584
<a name="l00482"></a>00482     l_uint32 *line = data + i * wpl;
 
585
<a name="l00483"></a>00483     <span class="keywordflow">for</span> (<span class="keywordtype">int</span> j = 0; j &lt; width; ++j)
 
586
<a name="l00484"></a>00484       <span class="keywordflow">if</span> (GET_DATA_BIT(line, j))
 
587
<a name="l00485"></a>00485         ++(hist_[j]);
 
588
<a name="l00486"></a>00486   }
 
589
<a name="l00487"></a>00487 }
 
590
<a name="l00488"></a>00488 
 
591
<a name="l00489"></a><a class="code" href="a00503.html#a7d423f56f2e8440301f8af11a952fade">00489</a> <span class="keywordtype">void</span> <a class="code" href="a00503.html#a7d423f56f2e8440301f8af11a952fade">PixelHistogram::ConstructHorizontalCountHist</a>(Pix* pix) {
 
592
<a name="l00490"></a>00490   <a class="code" href="a00503.html#aaa214752dc7cbb3923fcece5dff758ed">Clear</a>();
 
593
<a name="l00491"></a>00491   Numa* counts = pixCountPixelsByRow(pix, NULL);
 
594
<a name="l00492"></a>00492   length_ = numaGetCount(counts);
 
595
<a name="l00493"></a>00493   hist_ = <span class="keyword">new</span> <span class="keywordtype">int</span>[length_];
 
596
<a name="l00494"></a>00494   <span class="keywordflow">for</span> (<span class="keywordtype">int</span> i = 0; i &lt; length_; ++i) {
 
597
<a name="l00495"></a>00495     l_int32 val = 0;
 
598
<a name="l00496"></a>00496     numaGetIValue(counts, i, &amp;val);
 
599
<a name="l00497"></a>00497     hist_[i] = val;
 
600
<a name="l00498"></a>00498   }
 
601
<a name="l00499"></a>00499   numaDestroy(&amp;counts);
 
602
<a name="l00500"></a>00500 }
 
603
<a name="l00501"></a>00501 
 
604
<a name="l00502"></a>00502 }  <span class="comment">// namespace tesseract.</span>
 
605
</pre></div></div><!-- contents -->
 
606
</div>
 
607
<!-- window showing the filter options -->
 
608
<div id="MSearchSelectWindow"
 
609
     onmouseover="return searchBox.OnSearchSelectShow()"
 
610
     onmouseout="return searchBox.OnSearchSelectHide()"
 
611
     onkeydown="return searchBox.OnSearchSelectKey(event)">
 
612
<a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(0)"><span class="SelectionMark">&#160;</span>All</a><a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(1)"><span class="SelectionMark">&#160;</span>Classes</a><a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(2)"><span class="SelectionMark">&#160;</span>Namespaces</a><a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(3)"><span class="SelectionMark">&#160;</span>Files</a><a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(4)"><span class="SelectionMark">&#160;</span>Functions</a><a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(5)"><span class="SelectionMark">&#160;</span>Variables</a><a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(6)"><span class="SelectionMark">&#160;</span>Typedefs</a><a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(7)"><span class="SelectionMark">&#160;</span>Enumerations</a><a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(8)"><span class="SelectionMark">&#160;</span>Enumerator</a><a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(9)"><span class="SelectionMark">&#160;</span>Friends</a><a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(10)"><span class="SelectionMark">&#160;</span>Defines</a></div>
 
613
 
 
614
<!-- iframe showing the search results (closed by default) -->
 
615
<div id="MSearchResultsWindow">
 
616
<iframe src="javascript:void(0)" frameborder="0" 
 
617
        name="MSearchResults" id="MSearchResults">
 
618
</iframe>
 
619
</div>
 
620
 
 
621
  <div id="nav-path" class="navpath">
 
622
    <ul>
 
623
      <li class="navelem"><a class="el" href="a01106.html">devanagari_processing.cpp</a>      </li>
 
624
 
 
625
    <li class="footer">Generated on Mon Feb 3 2014 10:59:10 for tesseract by
 
626
    <a href="http://www.doxygen.org/index.html">
 
627
    <img class="footer" src="doxygen.png" alt="doxygen"/></a> 1.7.6.1 </li>
 
628
   </ul>
 
629
 </div>
 
630
 
 
631
 
 
632
</body>
 
633
</html>