2
2
* DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS HEADER.
4
4
* Copyright (c) 2007 Sun Microsystems, Inc. All Rights Reserved.
6
6
* The contents of this file are subject to the terms of either the GNU Lesser
7
7
* General Public License Version 2.1 only ("LGPL") or the Common Development and
8
8
* Distribution License ("CDDL")(collectively, the "License"). You may not use this
9
9
* file except in compliance with the License. You can obtain a copy of the CDDL at
10
10
* http://www.opensource.org/licenses/cddl1.php and a copy of the LGPLv2.1 at
11
* http://www.opensource.org/licenses/lgpl-license.php. See the License for the
11
* http://www.opensource.org/licenses/lgpl-license.php. See the License for the
12
12
* specific language governing permissions and limitations under the License. When
13
13
* distributing the software, include this License Header Notice in each file and
14
14
* include the full text of the License in the License file as well as the
15
15
* following notice:
17
17
* NOTICE PURSUANT TO SECTION 9 OF THE COMMON DEVELOPMENT AND DISTRIBUTION LICENSE
19
19
* For Covered Software in this distribution, this License shall be governed by the
21
21
* Any litigation relating to this License shall be subject to the jurisdiction of
22
22
* the Federal Courts of the Northern District of California and the state courts
23
23
* of the State of California, with venue lying in Santa Clara County, California.
27
27
* If you wish your version of this file to be governed by only the CDDL or only
28
28
* the LGPL Version 2.1, indicate your decision by adding "[Contributor]" elects to
29
29
* include this software in this distribution under the [CDDL or LGPL Version 2.1]
32
32
* Version 2.1, or to extend the choice of license to its licensees as provided
33
33
* above. However, if you add LGPL Version 2.1 code and therefore, elected the LGPL
34
34
* Version 2 license, then the option applies only if the new code is made subject
35
* to such option by the copyright holder.
35
* to such option by the copyright holder.
38
38
#ifndef _SIM_SENTENCIZER_H
46
46
class CSIMCharReader;
48
class SIMCharReaderIterator{
48
class SIMCharReaderIterator {
50
SIMCharReaderIterator(CSIMCharReader* the_reader=NULL, int the_idx = 0)
51
: reader(the_reader), idx(the_idx) { }
52
SIMCharReaderIterator& operator++();
53
SIMCharReaderIterator operator+(int i);
54
TWCHAR & operator*() const;
50
SIMCharReaderIterator(CSIMCharReader* the_reader = NULL, int the_idx = 0)
51
: reader(the_reader), idx(the_idx) { }
52
SIMCharReaderIterator& operator++();
53
SIMCharReaderIterator operator+(int i);
54
TWCHAR & operator*() const;
58
CSIMCharReader* reader;
57
CSIMCharReader* reader;
61
61
class CSIMCharReader {
62
friend class SIMCharReaderIterator;
65
typedef SIMCharReaderIterator iterator;
68
CSIMCharReader(FILE* afp) : fp(afp), buf() { }
69
iterator begin() { return iterator(this, 0); }
62
friend class SIMCharReaderIterator;
65
typedef SIMCharReaderIterator iterator;
68
CSIMCharReader(FILE* afp) : fp(afp), buf() { }
69
iterator begin() { return iterator(this, 0); }
73
std::deque<TWCHAR> buf;
73
std::deque<TWCHAR> buf;
76
76
template <class iterator>
77
bool ReadSentence(wstring& wstr, iterator& first, bool bIgnoreCRLF=false)
77
bool ReadSentence(wstring& wstr, iterator& first, bool bIgnoreCRLF = false){
80
79
TWCHAR ch, chnext, ch2;
82
for (; (ch=*first) != WCH_NULL; ++first) {
81
for (; (ch = *first) != WCH_NULL; ++first) {
82
chnext = *(first + 1);
85
84
if ((ch == WCH_RETURN) && bIgnoreCRLF && (chnext != WCH_RETURN))
87
86
if (ch == WCH_JUHAO || ch == WCH_WENHAO || ch == WCH_TANHAO ||
88
ch == WCH_TANHAO || ch == WCH_SHENGLUEHAO)
87
ch == WCH_TANHAO || ch == WCH_SHENGLUEHAO)
90
89
else if (ch == WCH_DOUHAO && chnext == WCH_DOUHAO)