1
package org.apache.lucene.analysis;
/*
 * Licensed to the Apache Software Foundation (ASF) under one or more
 * contributor license agreements. See the NOTICE file distributed with
 * this work for additional information regarding copyright ownership.
 * The ASF licenses this file to You under the Apache License, Version 2.0
 * (the "License"); you may not use this file except in compliance with
 * the License. You may obtain a copy of the License at
 *
 * http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

import org.apache.lucene.analysis.tokenattributes.CharTermAttribute;
21
import java.io.StringReader;
23
public class TestISOLatin1AccentFilter extends BaseTokenStreamTestCase {
24
public void testU() throws Exception {
25
TokenStream stream = new WhitespaceTokenizer(TEST_VERSION_CURRENT, new StringReader("Des mot clés À LA CHAÎNE À Á Â Ã Ä Å Æ Ç È É Ê Ë Ì Í Î Ï IJ Ð Ñ Ò Ó Ô Õ Ö Ø Œ Þ Ù Ú Û Ü Ý Ÿ à á â ã ä å æ ç è é ê ë ì í î ï ij ð ñ ò ó ô õ ö ø œ ß þ ù ú û ü ý ÿ fi fl"));
26
ISOLatin1AccentFilter filter = new ISOLatin1AccentFilter(stream);
27
CharTermAttribute termAtt = filter.getAttribute(CharTermAttribute.class);
28
assertTermEquals("Des", filter, termAtt);
29
assertTermEquals("mot", filter, termAtt);
30
assertTermEquals("cles", filter, termAtt);
31
assertTermEquals("A", filter, termAtt);
32
assertTermEquals("LA", filter, termAtt);
33
assertTermEquals("CHAINE", filter, termAtt);
34
assertTermEquals("A", filter, termAtt);
35
assertTermEquals("A", filter, termAtt);
36
assertTermEquals("A", filter, termAtt);
37
assertTermEquals("A", filter, termAtt);
38
assertTermEquals("A", filter, termAtt);
39
assertTermEquals("A", filter, termAtt);
40
assertTermEquals("AE", filter, termAtt);
41
assertTermEquals("C", filter, termAtt);
42
assertTermEquals("E", filter, termAtt);
43
assertTermEquals("E", filter, termAtt);
44
assertTermEquals("E", filter, termAtt);
45
assertTermEquals("E", filter, termAtt);
46
assertTermEquals("I", filter, termAtt);
47
assertTermEquals("I", filter, termAtt);
48
assertTermEquals("I", filter, termAtt);
49
assertTermEquals("I", filter, termAtt);
50
assertTermEquals("IJ", filter, termAtt);
51
assertTermEquals("D", filter, termAtt);
52
assertTermEquals("N", filter, termAtt);
53
assertTermEquals("O", filter, termAtt);
54
assertTermEquals("O", filter, termAtt);
55
assertTermEquals("O", filter, termAtt);
56
assertTermEquals("O", filter, termAtt);
57
assertTermEquals("O", filter, termAtt);
58
assertTermEquals("O", filter, termAtt);
59
assertTermEquals("OE", filter, termAtt);
60
assertTermEquals("TH", filter, termAtt);
61
assertTermEquals("U", filter, termAtt);
62
assertTermEquals("U", filter, termAtt);
63
assertTermEquals("U", filter, termAtt);
64
assertTermEquals("U", filter, termAtt);
65
assertTermEquals("Y", filter, termAtt);
66
assertTermEquals("Y", filter, termAtt);
67
assertTermEquals("a", filter, termAtt);
68
assertTermEquals("a", filter, termAtt);
69
assertTermEquals("a", filter, termAtt);
70
assertTermEquals("a", filter, termAtt);
71
assertTermEquals("a", filter, termAtt);
72
assertTermEquals("a", filter, termAtt);
73
assertTermEquals("ae", filter, termAtt);
74
assertTermEquals("c", filter, termAtt);
75
assertTermEquals("e", filter, termAtt);
76
assertTermEquals("e", filter, termAtt);
77
assertTermEquals("e", filter, termAtt);
78
assertTermEquals("e", filter, termAtt);
79
assertTermEquals("i", filter, termAtt);
80
assertTermEquals("i", filter, termAtt);
81
assertTermEquals("i", filter, termAtt);
82
assertTermEquals("i", filter, termAtt);
83
assertTermEquals("ij", filter, termAtt);
84
assertTermEquals("d", filter, termAtt);
85
assertTermEquals("n", filter, termAtt);
86
assertTermEquals("o", filter, termAtt);
87
assertTermEquals("o", filter, termAtt);
88
assertTermEquals("o", filter, termAtt);
89
assertTermEquals("o", filter, termAtt);
90
assertTermEquals("o", filter, termAtt);
91
assertTermEquals("o", filter, termAtt);
92
assertTermEquals("oe", filter, termAtt);
93
assertTermEquals("ss", filter, termAtt);
94
assertTermEquals("th", filter, termAtt);
95
assertTermEquals("u", filter, termAtt);
96
assertTermEquals("u", filter, termAtt);
97
assertTermEquals("u", filter, termAtt);
98
assertTermEquals("u", filter, termAtt);
99
assertTermEquals("y", filter, termAtt);
100
assertTermEquals("y", filter, termAtt);
101
assertTermEquals("fi", filter, termAtt);
102
assertTermEquals("fl", filter, termAtt);
103
assertFalse(filter.incrementToken());
106
void assertTermEquals(String expected, TokenStream stream, CharTermAttribute termAtt) throws Exception {
107
assertTrue(stream.incrementToken());
108
assertEquals(expected, termAtt.toString());