~ubuntu-branches/ubuntu/vivid/icu4j-4.4/vivid

while (m_optionarg_ < optionend && (UCharacter.isWhitespace(rules.charAt(m_optionarg_)) || UCharacterProperty.isRuleWhiteSpace(rules.charAt(m_optionarg_))))

1894

{ // eat whitespace

1895

m_optionarg_ ++;

1896

}

1897

}

1898

break;

1899

}

1900

i ++;

1901

}

1902

if(i == RULES_OPTIONS_.length) {

1903

i = -1;

1904

}

1905

return i;

1906

}

1907

/**

1908

* Reads and set collation options

1909

* @return TOKEN_SUCCESS if option is set correct, 0 otherwise

1910

* @exception ParseException thrown when options in rules are wrong

1911

1912

private byte readAndSetOption() throws ParseException

1913

{

1914

int start = m_current_ + 1; // skip opening '['

1915

int i = readOption(m_rules_, start, m_optionEnd_);

1916

1917

int optionarg = m_optionarg_;

1918

1919

if (i < 0) {

1920

throwParseException(m_rules_, start);

1921

}

1922

1923

if (i < 7) {

1924

if (optionarg != 0) {

1925

for (int j = 0; j < RULES_OPTIONS_[i].m_subOptions_.length;

1926

j ++) {

1927

String subname = RULES_OPTIONS_[i].m_subOptions_[j];

1928

int size = optionarg + subname.length();

1929

if (m_rules_.length() > size

1930

&& subname.equalsIgnoreCase(m_rules_.substring(

1931

optionarg, size))) {

1932

setOptions(m_options_, RULES_OPTIONS_[i].m_attribute_,

1933

RULES_OPTIONS_[i].m_subOptionAttributeValues_[j]);

1934

return TOKEN_SUCCESS_MASK_;

1935

}

1936

}

1937

}

1938

throwParseException(m_rules_, optionarg);

1939

}

1940

else if (i == 7) { // variable top

1941

return TOKEN_SUCCESS_MASK_ | TOKEN_VARIABLE_TOP_MASK_;

1942

}

1943

else if (i == 8) { // rearange

1944

return TOKEN_SUCCESS_MASK_;

1945

}

1946

else if (i == 9) { // before

1947

if (optionarg != 0) {

1948

for (int j = 0; j < RULES_OPTIONS_[i].m_subOptions_.length;

1949

j ++) {

1950

String subname = RULES_OPTIONS_[i].m_subOptions_[j];

1951

int size = optionarg + subname.length();

1952

if (m_rules_.length() > size

1953

&& subname.equalsIgnoreCase(

1954

m_rules_.substring(optionarg,

1955

optionarg + subname.length()))) {

1956

return (byte)(TOKEN_SUCCESS_MASK_

1957

| RULES_OPTIONS_[i].m_subOptionAttributeValues_[j]

1958

+ 1);

1959

}

1960

}

1961

}

1962

throwParseException(m_rules_, optionarg);

1963

}

1964

else if (i == 10) { // top, we are going to have an array with

1965

// structures of limit CEs index to this array will be

1966

// src->parsedToken.indirectIndex

1967

m_parsedToken_.m_indirectIndex_ = 0;

1968

return TOKEN_SUCCESS_MASK_ | TOKEN_TOP_MASK_;

1969

}

1970

else if (i < 13) { // first, last

1971

for (int j = 0; j < RULES_OPTIONS_[i].m_subOptions_.length; j ++) {

1972

String subname = RULES_OPTIONS_[i].m_subOptions_[j];

1973

int size = optionarg + subname.length();

1974

if (m_rules_.length() > size

1975

&& subname.equalsIgnoreCase(m_rules_.substring(optionarg,

1976

size))) {

1977

m_parsedToken_.m_indirectIndex_ = (char)(i - 10 + (j << 1));

1978

return TOKEN_SUCCESS_MASK_ | TOKEN_TOP_MASK_;

1979

}

1980

}

1981

throwParseException(m_rules_, optionarg);

1982

}

1983

else if(i == 13 || i == 14) { // copy and remove are handled before normalization

1984

// we need to move end here

1985

int noOpenBraces = 1;

1986

m_current_++; // skip opening brace

1987

while(m_current_ < m_source_.length() && noOpenBraces != 0) {

1988

if(m_source_.charAt(m_current_) == '[') {

1989

noOpenBraces++;

1990

} else if(m_source_.charAt(m_current_) == ']') { // closing brace

1991

noOpenBraces--;

1992

}

1993

m_current_++;

1994

}

1995

m_optionEnd_ = m_current_-1;

1996

return TOKEN_SUCCESS_MASK_;

1997

}

1998

else {

1999

throwParseException(m_rules_, optionarg);

2000

}

2001

return TOKEN_SUCCESS_MASK_; // we will never reach here.

2002

}

2003

2004

/**

2005

* Set collation option

2006

* @param optionset option set to set

2007

* @param attribute type to set

2008

* @param value attribute value

2009

2010

private void setOptions(OptionSet optionset, int attribute, int value)

2011

{

2012

switch (attribute) {

2013

case RuleBasedCollator.Attribute.HIRAGANA_QUATERNARY_MODE_ :

2014

optionset.m_isHiragana4_

2015

= (value == RuleBasedCollator.AttributeValue.ON_);

2016

break;

2017

case RuleBasedCollator.Attribute.FRENCH_COLLATION_ :

2018

optionset.m_isFrenchCollation_

2019

= (value == RuleBasedCollator.AttributeValue.ON_);

2020

break;

2021

case RuleBasedCollator.Attribute.ALTERNATE_HANDLING_ :

2022

optionset.m_isAlternateHandlingShifted_

2023

= (value

2024

== RuleBasedCollator.AttributeValue.SHIFTED_);

2025

break;

2026

case RuleBasedCollator.Attribute.CASE_FIRST_ :

2027

optionset.m_caseFirst_ = value;

2028

break;

2029

case RuleBasedCollator.Attribute.CASE_LEVEL_ :

2030

optionset.m_isCaseLevel_

2031

= (value == RuleBasedCollator.AttributeValue.ON_);

2032

break;

2033

case RuleBasedCollator.Attribute.NORMALIZATION_MODE_ :

2034

if (value == RuleBasedCollator.AttributeValue.ON_) {

2035

value = Collator.CANONICAL_DECOMPOSITION;

2036

}

2037

optionset.m_decomposition_ = value;

2038

break;

2039

case RuleBasedCollator.Attribute.STRENGTH_ :

2040

optionset.m_strength_ = value;

2041

break;

2042

default :

2043

break;

2044

}

2045

}

2046

2047

UnicodeSet getTailoredSet() throws ParseException

2048

{

2049

boolean startOfRules = true;

2050

UnicodeSet tailored = new UnicodeSet();

2051

String pattern;

2052

CanonicalIterator it = new CanonicalIterator("");

2053

2054

m_parsedToken_.m_strength_ = TOKEN_UNSET_;

2055

int sourcelimit = m_source_.length();

2056

//int expandNext = 0;

2057

2058

while (m_current_ < sourcelimit) {

2059

m_parsedToken_.m_prefixOffset_ = 0;

2060

if (parseNextToken(startOfRules) < 0) {

2061

// we have reached the end

2062

continue;

2063

}

2064

startOfRules = false;

2065

// The idea is to tokenize the rule set. For each non-reset token,

2066

// we add all the canonicaly equivalent FCD sequences

2067

if(m_parsedToken_.m_strength_ != TOKEN_RESET_) {

2068

it.setSource(m_source_.substring(

2069

m_parsedToken_.m_charsOffset_,

2070

m_parsedToken_.m_charsOffset_+m_parsedToken_.m_charsLen_));

2071

pattern = it.next();

2072

while(pattern != null) {

2073

if(Normalizer.quickCheck(pattern, Normalizer.FCD,0) != Normalizer.NO) {

2074

tailored.add(pattern);

2075

}

2076

pattern = it.next();

2077

}

2078

}

2079

}

2080

return tailored;

2081

}

2082

2083

final private void extractSetsFromRules(String rules) throws ParseException {

2084

int optionNumber = -1;

2085

int setStart = 0;

2086

int i = 0;

2087

while(i < rules.length()) {

2088

if(rules.charAt(i) == 0x005B) {

2089

optionNumber = readOption(rules, i+1, rules.length());

2090

setStart = m_optionarg_;

2091

if(optionNumber == 13) { /* copy - parts of UCA to tailoring */

2092

UnicodeSet newSet = readAndSetUnicodeSet(rules, setStart);

2093

if(m_copySet_ == null) {

2094

m_copySet_ = newSet;

2095

} else {

2096

m_copySet_.addAll(newSet);

2097

}

2098

} else if(optionNumber == 14) {

2099

UnicodeSet newSet = readAndSetUnicodeSet(rules, setStart);

2100

if(m_removeSet_ == null) {

2101

m_removeSet_ = newSet;

2102

} else {

2103

m_removeSet_.addAll(newSet);

2104

}

2105

}

2106

}

2107

i++;

2108

}

2109

}

2110

}

Older »