1
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
2
<html xmlns="http://www.w3.org/1999/xhtml">
4
<meta http-equiv="Content-Type" content="text/xhtml;charset=UTF-8"/>
5
<meta http-equiv="X-UA-Compatible" content="IE=9"/>
6
<title>tesseract: /usr/local/google/home/jbreiden/tesseract-ocr-read-only/cube/classifier_base.h Source File</title>
8
<link href="tabs.css" rel="stylesheet" type="text/css"/>
9
<link href="doxygen.css" rel="stylesheet" type="text/css" />
10
<link href="navtree.css" rel="stylesheet" type="text/css"/>
11
<script type="text/javascript" src="jquery.js"></script>
12
<script type="text/javascript" src="resize.js"></script>
13
<script type="text/javascript" src="navtree.js"></script>
14
<script type="text/javascript">
15
$(document).ready(initResizable);
17
<link href="search/search.css" rel="stylesheet" type="text/css"/>
18
<script type="text/javascript" src="search/search.js"></script>
19
<script type="text/javascript">
20
$(document).ready(function() { searchBox.OnSelectItem(0); });
25
<div id="top"><!-- do not remove this div! -->
29
<table cellspacing="0" cellpadding="0">
31
<tr style="height: 56px;">
34
<td style="padding-left: 0.5em;">
35
<div id="projectname">tesseract
36
 <span id="projectnumber">3.03</span>
48
<!-- Generated by Doxygen 1.7.6.1 -->
49
<script type="text/javascript">
50
var searchBox = new SearchBox("searchBox", "search",false,'Search');
52
<div id="navrow1" class="tabs">
54
<li><a href="index.html"><span>Main Page</span></a></li>
55
<li><a href="pages.html"><span>Related Pages</span></a></li>
56
<li><a href="modules.html"><span>Modules</span></a></li>
57
<li><a href="namespaces.html"><span>Namespaces</span></a></li>
58
<li><a href="annotated.html"><span>Classes</span></a></li>
59
<li class="current"><a href="files.html"><span>Files</span></a></li>
61
<div id="MSearchBox" class="MSearchBoxInactive">
63
<img id="MSearchSelect" src="search/mag_sel.png"
64
onmouseover="return searchBox.OnSearchSelectShow()"
65
onmouseout="return searchBox.OnSearchSelectHide()"
67
<input type="text" id="MSearchField" value="Search" accesskey="S"
68
onfocus="searchBox.OnSearchFieldFocus(true)"
69
onblur="searchBox.OnSearchFieldFocus(false)"
70
onkeyup="searchBox.OnSearchFieldChange(event)"/>
71
</span><span class="right">
72
<a id="MSearchClose" href="javascript:searchBox.CloseResultsWindow()"><img id="MSearchCloseImg" border="0" src="search/close.png" alt=""/></a>
78
<div id="navrow2" class="tabs2">
80
<li><a href="files.html"><span>File List</span></a></li>
81
<li><a href="globals.html"><span>File Members</span></a></li>
85
<div id="side-nav" class="ui-resizable side-nav-resizable">
87
<div id="nav-tree-contents">
90
<div id="splitbar" style="-moz-user-select:none;"
91
class="ui-resizable-handle">
94
<script type="text/javascript">
95
initNavTree('a00972.html','');
97
<div id="doc-content">
99
<div class="headertitle">
100
<div class="title">/usr/local/google/home/jbreiden/tesseract-ocr-read-only/cube/classifier_base.h</div> </div>
102
<div class="contents">
103
<a href="a00972.html">Go to the documentation of this file.</a><div class="fragment"><pre class="fragment"><a name="l00001"></a>00001 <span class="comment">/**********************************************************************</span>
104
<a name="l00002"></a>00002 <span class="comment"> * File: classifier_base.h</span>
105
<a name="l00003"></a>00003 <span class="comment"> * Description: Declaration of the Base Character Classifier</span>
106
<a name="l00004"></a>00004 <span class="comment"> * Author: Ahmad Abdulkader</span>
107
<a name="l00005"></a>00005 <span class="comment"> * Created: 2007</span>
108
<a name="l00006"></a>00006 <span class="comment"> *</span>
109
<a name="l00007"></a>00007 <span class="comment"> * (C) Copyright 2008, Google Inc.</span>
110
<a name="l00008"></a>00008 <span class="comment"> ** Licensed under the Apache License, Version 2.0 (the "License");</span>
111
<a name="l00009"></a>00009 <span class="comment"> ** you may not use this file except in compliance with the License.</span>
112
<a name="l00010"></a>00010 <span class="comment"> ** You may obtain a copy of the License at</span>
113
<a name="l00011"></a>00011 <span class="comment"> ** http://www.apache.org/licenses/LICENSE-2.0</span>
114
<a name="l00012"></a>00012 <span class="comment"> ** Unless required by applicable law or agreed to in writing, software</span>
115
<a name="l00013"></a>00013 <span class="comment"> ** distributed under the License is distributed on an "AS IS" BASIS,</span>
116
<a name="l00014"></a>00014 <span class="comment"> ** WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.</span>
117
<a name="l00015"></a>00015 <span class="comment"> ** See the License for the specific language governing permissions and</span>
118
<a name="l00016"></a>00016 <span class="comment"> ** limitations under the License.</span>
119
<a name="l00017"></a>00017 <span class="comment"> *</span>
120
<a name="l00018"></a>00018 <span class="comment"> **********************************************************************/</span>
121
<a name="l00019"></a>00019
122
<a name="l00020"></a>00020 <span class="comment">// The CharClassifier class is the abstract class for any character/grapheme</span>
123
<a name="l00021"></a>00021 <span class="comment">// classifier.</span>
124
<a name="l00022"></a>00022
125
<a name="l00023"></a>00023 <span class="preprocessor">#ifndef CHAR_CLASSIFIER_BASE_H</span>
126
<a name="l00024"></a>00024 <span class="preprocessor"></span><span class="preprocessor">#define CHAR_CLASSIFIER_BASE_H</span>
127
<a name="l00025"></a>00025 <span class="preprocessor"></span>
128
<a name="l00026"></a>00026 <span class="preprocessor">#include &lt;string&gt;</span>
129
<a name="l00027"></a>00027 <span class="preprocessor">#include "<a class="code" href="a00965.html">char_samp.h</a>"</span>
130
<a name="l00028"></a>00028 <span class="preprocessor">#include "<a class="code" href="a00961.html">char_altlist.h</a>"</span>
131
<a name="l00029"></a>00029 <span class="preprocessor">#include "<a class="code" href="a00971.html">char_set.h</a>"</span>
132
<a name="l00030"></a>00030 <span class="preprocessor">#include "<a class="code" href="a00992.html">feature_base.h</a>"</span>
133
<a name="l00031"></a>00031 <span class="preprocessor">#include "<a class="code" href="a01002.html">lang_model.h</a>"</span>
134
<a name="l00032"></a>00032 <span class="preprocessor">#include "<a class="code" href="a01013.html">tuning_params.h</a>"</span>
135
<a name="l00033"></a>00033
136
<a name="l00034"></a>00034 <span class="keyword">namespace </span><a class="code" href="a01266.html#afed58feacb84df2de88bdd613cfdba6d">tesseract</a> {
137
<a name="l00035"></a><a class="code" href="a00304.html">00035</a> <span class="keyword">class </span><a class="code" href="a00304.html">CharClassifier</a> {
138
<a name="l00036"></a>00036 <span class="keyword">public</span>:
139
<a name="l00037"></a><a class="code" href="a00304.html#a08c3672c2062828c840d830c7a16639b">00037</a> <a class="code" href="a00304.html#a08c3672c2062828c840d830c7a16639b">CharClassifier</a>(<a class="code" href="a00309.html">CharSet</a> *char_set, <a class="code" href="a00634.html">TuningParams</a> *params,
140
<a name="l00038"></a>00038 <a class="code" href="a00381.html">FeatureBase</a> *feat_extract) {
141
<a name="l00039"></a>00039 <a class="code" href="a00304.html#afbe25062436573d4a3b8c9e9936f6013">char_set_</a> = char_set;
142
<a name="l00040"></a>00040 <a class="code" href="a00304.html#af2e7491d921d252957ae0ea4cdaf9aff">params_</a> = params;
143
<a name="l00041"></a>00041 <a class="code" href="a00304.html#ab8e30443f3f9a1d1e9ca5640608a47a8">feat_extract_</a> = feat_extract;
144
<a name="l00042"></a>00042 <a class="code" href="a00304.html#ad7acb8330f63320bb636c66d31b815dc">fold_sets_</a> = NULL;
145
<a name="l00043"></a>00043 <a class="code" href="a00304.html#aa00adf41e98123f259e463b037908db7">fold_set_cnt_</a> = 0;
146
<a name="l00044"></a>00044 <a class="code" href="a00304.html#a883ce8cb0ee930611abcd061153a3be2">fold_set_len_</a> = NULL;
147
<a name="l00045"></a>00045 <a class="code" href="a00304.html#ac5b9df929e2570650b263f0a1504125b">init_</a> = <span class="keyword">false</span>;
148
<a name="l00046"></a>00046 <a class="code" href="a00304.html#aaabb1acf1d7ebcd2b66e1f9796cc49dc">case_sensitive_</a> = <span class="keyword">true</span>;
149
<a name="l00047"></a>00047 }
150
<a name="l00048"></a>00048
151
<a name="l00049"></a><a class="code" href="a00304.html#afac874bedbc52b288b5e064bed170dce">00049</a> <span class="keyword">virtual</span> <a class="code" href="a00304.html#afac874bedbc52b288b5e064bed170dce">~CharClassifier</a>() {
152
<a name="l00050"></a>00050 <span class="keywordflow">if</span> (<a class="code" href="a00304.html#ad7acb8330f63320bb636c66d31b815dc">fold_sets_</a> != NULL) {
153
<a name="l00051"></a>00051 <span class="keywordflow">for</span> (<span class="keywordtype">int</span> fold_set = 0; fold_set &lt; <a class="code" href="a00304.html#aa00adf41e98123f259e463b037908db7">fold_set_cnt_</a>; fold_set++) {
154
<a name="l00052"></a>00052 <span class="keywordflow">if</span> (<a class="code" href="a00304.html#ad7acb8330f63320bb636c66d31b815dc">fold_sets_</a>[fold_set] != NULL) {
155
<a name="l00053"></a>00053 <span class="keyword">delete</span> []<a class="code" href="a00304.html#ad7acb8330f63320bb636c66d31b815dc">fold_sets_</a>[fold_set];
156
<a name="l00054"></a>00054 }
157
<a name="l00055"></a>00055 }
158
<a name="l00056"></a>00056 <span class="keyword">delete</span> []<a class="code" href="a00304.html#ad7acb8330f63320bb636c66d31b815dc">fold_sets_</a>;
159
<a name="l00057"></a>00057 <a class="code" href="a00304.html#ad7acb8330f63320bb636c66d31b815dc">fold_sets_</a> = NULL;
160
<a name="l00058"></a>00058 }
161
<a name="l00059"></a>00059 <span class="keywordflow">if</span> (<a class="code" href="a00304.html#a883ce8cb0ee930611abcd061153a3be2">fold_set_len_</a> != NULL) {
162
<a name="l00060"></a>00060 <span class="keyword">delete</span> []<a class="code" href="a00304.html#a883ce8cb0ee930611abcd061153a3be2">fold_set_len_</a>;
163
<a name="l00061"></a>00061 <a class="code" href="a00304.html#a883ce8cb0ee930611abcd061153a3be2">fold_set_len_</a> = NULL;
164
<a name="l00062"></a>00062 }
165
<a name="l00063"></a>00063 <span class="keywordflow">if</span> (<a class="code" href="a00304.html#ab8e30443f3f9a1d1e9ca5640608a47a8">feat_extract_</a> != NULL) {
166
<a name="l00064"></a>00064 <span class="keyword">delete</span> <a class="code" href="a00304.html#ab8e30443f3f9a1d1e9ca5640608a47a8">feat_extract_</a>;
167
<a name="l00065"></a>00065 <a class="code" href="a00304.html#ab8e30443f3f9a1d1e9ca5640608a47a8">feat_extract_</a> = NULL;
168
<a name="l00066"></a>00066 }
169
<a name="l00067"></a>00067 }
170
<a name="l00068"></a>00068
171
<a name="l00069"></a>00069 <span class="comment">// pure virtual functions that need to be implemented by any inheriting class</span>
172
<a name="l00070"></a>00070 <span class="keyword">virtual</span> <a class="code" href="a00300.html">CharAltList</a> * <a class="code" href="a00304.html#ae133c2172d9bc6ae1726ae9a436755f1">Classify</a>(<a class="code" href="a00306.html">CharSamp</a> *char_samp) = 0;
173
<a name="l00071"></a>00071 <span class="keyword">virtual</span> <span class="keywordtype">int</span> <a class="code" href="a00304.html#aa447f4775f256d36dab382f1bbb7b56c">CharCost</a>(<a class="code" href="a00306.html">CharSamp</a> *char_samp) = 0;
174
<a name="l00072"></a>00072 <span class="keyword">virtual</span> <span class="keywordtype">bool</span> <a class="code" href="a00304.html#a3ee7b00c9999051a92426b6de0bc7e5d">Train</a>(<a class="code" href="a00306.html">CharSamp</a> *char_samp, <span class="keywordtype">int</span> ClassID) = 0;
175
<a name="l00073"></a>00073 <span class="keyword">virtual</span> <span class="keywordtype">bool</span> <a class="code" href="a00304.html#ab2c1ff04d245d64d7900afefae9ef842">SetLearnParam</a>(<span class="keywordtype">char</span> *var_name, <span class="keywordtype">float</span> val) = 0;
176
<a name="l00074"></a>00074 <span class="keyword">virtual</span> <span class="keywordtype">bool</span> <a class="code" href="a00304.html#a64532c78a06560da1fb9ed7d54d9309f">Init</a>(<span class="keyword">const</span> <span class="keywordtype">string</span> &amp;data_file_path, <span class="keyword">const</span> <span class="keywordtype">string</span> &amp;<a class="code" href="a01266.html#a4d02e13fee24fdebbbe98ccdcb9c9279">lang</a>,
177
<a name="l00075"></a>00075 <a class="code" href="a00445.html">LangModel</a> *lang_mod) = 0;
178
<a name="l00076"></a>00076
179
<a name="l00077"></a>00077 <span class="comment">// accessors</span>
180
<a name="l00078"></a><a class="code" href="a00304.html#ae68e84dfd759cb08e82d2cee97abd3b2">00078</a> <a class="code" href="a00381.html">FeatureBase</a> *<a class="code" href="a00304.html#ae68e84dfd759cb08e82d2cee97abd3b2">FeatureExtractor</a>() {<span class="keywordflow">return</span> <a class="code" href="a00304.html#ab8e30443f3f9a1d1e9ca5640608a47a8">feat_extract_</a>;}
181
<a name="l00079"></a><a class="code" href="a00304.html#ac985e2cf1310211262590b0952ab2fa9">00079</a> <span class="keyword">inline</span> <span class="keywordtype">bool</span> <a class="code" href="a00304.html#ac985e2cf1310211262590b0952ab2fa9">CaseSensitive</a>()<span class="keyword"> const </span>{ <span class="keywordflow">return</span> <a class="code" href="a00304.html#aaabb1acf1d7ebcd2b66e1f9796cc49dc">case_sensitive_</a>; }
182
<a name="l00080"></a><a class="code" href="a00304.html#a5480d01debdf57b4d2d2189c2c499e2d">00080</a> <span class="keyword">inline</span> <span class="keywordtype">void</span> <a class="code" href="a00304.html#a5480d01debdf57b4d2d2189c2c499e2d">SetCaseSensitive</a>(<span class="keywordtype">bool</span> case_sensitive) {
183
<a name="l00081"></a>00081 <a class="code" href="a00304.html#aaabb1acf1d7ebcd2b66e1f9796cc49dc">case_sensitive_</a> = case_sensitive;
184
<a name="l00082"></a>00082 }
185
<a name="l00083"></a>00083
186
<a name="l00084"></a>00084 <span class="keyword">protected</span>:
187
<a name="l00085"></a>00085 <span class="keyword">virtual</span> <span class="keywordtype">void</span> <a class="code" href="a00304.html#a38059a0e194a7e1ab1099f15bb0c4a87">Fold</a>() = 0;
188
<a name="l00086"></a>00086 <span class="keyword">virtual</span> <span class="keywordtype">bool</span> <a class="code" href="a00304.html#ada1bba5a3763258805be98302083eb8e">LoadFoldingSets</a>(<span class="keyword">const</span> <span class="keywordtype">string</span> &amp;data_file_path,
189
<a name="l00087"></a>00087 <span class="keyword">const</span> <span class="keywordtype">string</span> &amp;<a class="code" href="a01266.html#a4d02e13fee24fdebbbe98ccdcb9c9279">lang</a>,
190
<a name="l00088"></a>00088 <a class="code" href="a00445.html">LangModel</a> *lang_mod) = 0;
191
<a name="l00089"></a><a class="code" href="a00304.html#ab8e30443f3f9a1d1e9ca5640608a47a8">00089</a> <a class="code" href="a00381.html">FeatureBase</a> *<a class="code" href="a00304.html#ab8e30443f3f9a1d1e9ca5640608a47a8">feat_extract_</a>;
192
<a name="l00090"></a><a class="code" href="a00304.html#afbe25062436573d4a3b8c9e9936f6013">00090</a> <a class="code" href="a00309.html">CharSet</a> *<a class="code" href="a00304.html#afbe25062436573d4a3b8c9e9936f6013">char_set_</a>;
193
<a name="l00091"></a><a class="code" href="a00304.html#af2e7491d921d252957ae0ea4cdaf9aff">00091</a> <a class="code" href="a00634.html">TuningParams</a> *<a class="code" href="a00304.html#af2e7491d921d252957ae0ea4cdaf9aff">params_</a>;
194
<a name="l00092"></a><a class="code" href="a00304.html#ad7acb8330f63320bb636c66d31b815dc">00092</a> <span class="keywordtype">int</span> **<a class="code" href="a00304.html#ad7acb8330f63320bb636c66d31b815dc">fold_sets_</a>;
195
<a name="l00093"></a><a class="code" href="a00304.html#a883ce8cb0ee930611abcd061153a3be2">00093</a> <span class="keywordtype">int</span> *<a class="code" href="a00304.html#a883ce8cb0ee930611abcd061153a3be2">fold_set_len_</a>;
196
<a name="l00094"></a><a class="code" href="a00304.html#aa00adf41e98123f259e463b037908db7">00094</a> <span class="keywordtype">int</span> <a class="code" href="a00304.html#aa00adf41e98123f259e463b037908db7">fold_set_cnt_</a>;
197
<a name="l00095"></a><a class="code" href="a00304.html#ac5b9df929e2570650b263f0a1504125b">00095</a> <span class="keywordtype">bool</span> <a class="code" href="a00304.html#ac5b9df929e2570650b263f0a1504125b">init_</a>;
198
<a name="l00096"></a><a class="code" href="a00304.html#aaabb1acf1d7ebcd2b66e1f9796cc49dc">00096</a> <span class="keywordtype">bool</span> <a class="code" href="a00304.html#aaabb1acf1d7ebcd2b66e1f9796cc49dc">case_sensitive_</a>;
199
<a name="l00097"></a>00097 };
200
<a name="l00098"></a>00098 } <span class="comment">// tesseract</span>
201
<a name="l00099"></a>00099
202
<a name="l00100"></a>00100 <span class="preprocessor">#endif // CHAR_CLASSIFIER_BASE_H</span>
203
</pre></div></div><!-- contents -->
205
<!-- window showing the filter options -->
206
<div id="MSearchSelectWindow"
207
onmouseover="return searchBox.OnSearchSelectShow()"
208
onmouseout="return searchBox.OnSearchSelectHide()"
209
onkeydown="return searchBox.OnSearchSelectKey(event)">
210
<a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(0)"><span class="SelectionMark"> </span>All</a><a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(1)"><span class="SelectionMark"> </span>Classes</a><a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(2)"><span class="SelectionMark"> </span>Namespaces</a><a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(3)"><span class="SelectionMark"> </span>Files</a><a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(4)"><span class="SelectionMark"> </span>Functions</a><a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(5)"><span class="SelectionMark"> </span>Variables</a><a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(6)"><span class="SelectionMark"> </span>Typedefs</a><a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(7)"><span class="SelectionMark"> </span>Enumerations</a><a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(8)"><span class="SelectionMark"> </span>Enumerator</a><a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(9)"><span class="SelectionMark"> </span>Friends</a><a class="SelectItem" href="javascript:void(0)" onclick="searchBox.OnSelectItem(10)"><span class="SelectionMark"> </span>Defines</a></div>
212
<!-- iframe showing the search results (closed by default) -->
213
<div id="MSearchResultsWindow">
214
<iframe src="javascript:void(0)" frameborder="0"
215
name="MSearchResults" id="MSearchResults">
219
<div id="nav-path" class="navpath">
221
<li class="navelem"><a class="el" href="a00972.html">classifier_base.h</a> </li>
223
<li class="footer">Generated on Mon Feb 3 2014 10:59:09 for tesseract by
224
<a href="http://www.doxygen.org/index.html">
225
<img class="footer" src="doxygen.png" alt="doxygen"/></a> 1.7.6.1 </li>