~ubuntu-branches/debian/sid/golang-github-blevesearch-bleve/sid

« back to all changes in this revision

Viewing changes to analysis/token/camelcase/camelcase.go

Committer: Package Import Robot
Author(s): Michael Lustfield
Date: 2017-03-30 16:06:03 UTC
Revision ID: package-import@ubuntu.com-20170330160603-0oogmb960l7918jx

Tags: upstream-0.5.0+git20170324.202.4702785f

Import upstream version 0.5.0+git20170324.202.4702785f

files added:

.travis.yml

CONTRIBUTING.md

LICENSE

README.md

analysis

analysis/analyzer

analysis/analyzer/custom

analysis/analyzer/custom/custom.go

analysis/analyzer/keyword

analysis/analyzer/keyword/keyword.go

analysis/analyzer/simple

analysis/analyzer/simple/simple.go

analysis/analyzer/standard

analysis/analyzer/standard/standard.go

analysis/analyzer/web

analysis/analyzer/web/web.go

analysis/benchmark_test.go

analysis/char

analysis/char/html

analysis/char/html/html.go

analysis/char/regexp

analysis/char/regexp/regexp.go

analysis/char/regexp/regexp_test.go

analysis/char/zerowidthnonjoiner

analysis/char/zerowidthnonjoiner/zerowidthnonjoiner.go

analysis/datetime

analysis/datetime/flexible

analysis/datetime/flexible/flexible.go

analysis/datetime/flexible/flexible_test.go

analysis/datetime/optional

analysis/datetime/optional/optional.go

analysis/freq.go

analysis/freq_test.go

analysis/lang

analysis/lang/ar

analysis/lang/ar/analyzer_ar.go

analysis/lang/ar/analyzer_ar_test.go

analysis/lang/ar/arabic_normalize.go

analysis/lang/ar/arabic_normalize_test.go

analysis/lang/ar/stemmer_ar.go

analysis/lang/ar/stemmer_ar_test.go

analysis/lang/ar/stop_filter_ar.go

analysis/lang/ar/stop_words_ar.go

analysis/lang/bg

analysis/lang/bg/stop_filter_bg.go

analysis/lang/bg/stop_words_bg.go

analysis/lang/ca

analysis/lang/ca/articles_ca.go

analysis/lang/ca/elision_ca.go

analysis/lang/ca/elision_ca_test.go

analysis/lang/ca/stop_filter_ca.go

analysis/lang/ca/stop_words_ca.go

analysis/lang/cjk

analysis/lang/cjk/analyzer_cjk.go

analysis/lang/cjk/analyzer_cjk_test.go

analysis/lang/cjk/cjk_bigram.go

analysis/lang/cjk/cjk_bigram_test.go

analysis/lang/cjk/cjk_width.go

analysis/lang/cjk/cjk_width_test.go

analysis/lang/ckb

analysis/lang/ckb/analyzer_ckb.go

analysis/lang/ckb/analyzer_ckb_test.go

analysis/lang/ckb/sorani_normalize.go

analysis/lang/ckb/sorani_normalize_test.go

analysis/lang/ckb/sorani_stemmer_filter.go

analysis/lang/ckb/sorani_stemmer_filter_test.go

analysis/lang/ckb/stop_filter_ckb.go

analysis/lang/ckb/stop_words_ckb.go

analysis/lang/cs

analysis/lang/cs/stop_filter_cs.go

analysis/lang/cs/stop_words_cs.go

analysis/lang/el

analysis/lang/el/stop_filter_el.go

analysis/lang/el/stop_words_el.go

analysis/lang/en

analysis/lang/en/analyzer_en.go

analysis/lang/en/analyzer_en_test.go

analysis/lang/en/possessive_filter_en.go

analysis/lang/en/possessive_filter_en_test.go

analysis/lang/en/stop_filter_en.go

analysis/lang/en/stop_words_en.go

analysis/lang/eu

analysis/lang/eu/stop_filter_eu.go

analysis/lang/eu/stop_words_eu.go

analysis/lang/fa

analysis/lang/fa/analyzer_fa.go

analysis/lang/fa/analyzer_fa_test.go

analysis/lang/fa/persian_normalize.go

analysis/lang/fa/persian_normalize_test.go

analysis/lang/fa/stop_filter_fa.go

analysis/lang/fa/stop_words_fa.go

analysis/lang/fr

analysis/lang/fr/analyzer_fr.go

analysis/lang/fr/analyzer_fr_test.go

analysis/lang/fr/articles_fr.go

analysis/lang/fr/elision_fr.go

analysis/lang/fr/elision_fr_test.go

analysis/lang/fr/light_stemmer_fr.go

analysis/lang/fr/light_stemmer_fr_test.go

analysis/lang/fr/minimal_stemmer_fr.go

analysis/lang/fr/minimal_stemmer_fr_test.go

analysis/lang/fr/stop_filter_fr.go

analysis/lang/fr/stop_words_fr.go

analysis/lang/ga

analysis/lang/ga/articles_ga.go

analysis/lang/ga/elision_ga.go

analysis/lang/ga/elision_ga_test.go

analysis/lang/ga/stop_filter_ga.go

analysis/lang/ga/stop_words_ga.go

analysis/lang/gl

analysis/lang/gl/stop_filter_gl.go

analysis/lang/gl/stop_words_gl.go

analysis/lang/hi

analysis/lang/hi/analyzer_hi.go

analysis/lang/hi/analyzer_hi_test.go

analysis/lang/hi/hindi_normalize.go

analysis/lang/hi/hindi_normalize_test.go

analysis/lang/hi/hindi_stemmer_filter.go

analysis/lang/hi/hindi_stemmer_filter_test.go

analysis/lang/hi/stop_filter_hi.go

analysis/lang/hi/stop_words_hi.go

analysis/lang/hy

analysis/lang/hy/stop_filter_hy.go

analysis/lang/hy/stop_words_hy.go

analysis/lang/id

analysis/lang/id/stop_filter_id.go

analysis/lang/id/stop_words_id.go

analysis/lang/in

analysis/lang/in/indic_normalize.go

analysis/lang/in/indic_normalize_test.go

analysis/lang/in/scripts.go

analysis/lang/it

analysis/lang/it/analyzer_it.go

analysis/lang/it/analyzer_it_test.go

analysis/lang/it/articles_it.go

analysis/lang/it/elision_it.go

analysis/lang/it/elision_it_test.go

analysis/lang/it/light_stemmer_it.go

analysis/lang/it/light_stemmer_it_test.go

analysis/lang/it/stop_filter_it.go

analysis/lang/it/stop_words_it.go

analysis/lang/pt

analysis/lang/pt/analyzer_pt.go

analysis/lang/pt/analyzer_pt_test.go

analysis/lang/pt/light_stemmer_pt.go

analysis/lang/pt/light_stemmer_pt_test.go

analysis/lang/pt/stop_filter_pt.go

analysis/lang/pt/stop_words_pt.go

analysis/test_words.txt

analysis/token

analysis/token/apostrophe

analysis/token/apostrophe/apostrophe.go

analysis/token/apostrophe/apostrophe_test.go

analysis/token/camelcase

analysis/token/camelcase/camelcase.go

analysis/token/camelcase/camelcase_test.go

analysis/token/camelcase/parser.go

analysis/token/camelcase/states.go

analysis/token/compound

analysis/token/compound/dict.go

analysis/token/compound/dict_test.go

analysis/token/edgengram

analysis/token/edgengram/edgengram.go

analysis/token/edgengram/edgengram_test.go

analysis/token/elision

analysis/token/elision/elision.go

analysis/token/elision/elision_test.go

analysis/token/keyword

analysis/token/keyword/keyword.go

analysis/token/keyword/keyword_test.go

analysis/token/length

analysis/token/length/length.go

analysis/token/length/length_test.go

analysis/token/lowercase

analysis/token/lowercase/lowercase.go

analysis/token/lowercase/lowercase_test.go

analysis/token/ngram

analysis/token/ngram/ngram.go

analysis/token/ngram/ngram_test.go

analysis/token/porter

analysis/token/porter/porter.go

analysis/token/porter/porter_test.go

analysis/token/shingle

analysis/token/shingle/shingle.go

analysis/token/shingle/shingle_test.go

analysis/token/stop

analysis/token/stop/stop.go

analysis/token/stop/stop_test.go

analysis/token/truncate

analysis/token/truncate/truncate.go

analysis/token/truncate/truncate_test.go

analysis/token/unicodenorm

analysis/token/unicodenorm/unicodenorm.go

analysis/token/unicodenorm/unicodenorm_test.go

analysis/tokenizer

analysis/tokenizer/character

analysis/tokenizer/character/character.go

analysis/tokenizer/character/character_test.go

analysis/tokenizer/exception

analysis/tokenizer/exception/exception.go

analysis/tokenizer/exception/exception_test.go

analysis/tokenizer/letter

analysis/tokenizer/letter/letter.go

analysis/tokenizer/regexp

analysis/tokenizer/regexp/regexp.go

analysis/tokenizer/regexp/regexp_test.go

analysis/tokenizer/single

analysis/tokenizer/single/single.go

analysis/tokenizer/single/single_test.go

analysis/tokenizer/unicode

analysis/tokenizer/unicode/unicode.go

analysis/tokenizer/unicode/unicode_test.go

analysis/tokenizer/web

analysis/tokenizer/web/web.go

analysis/tokenizer/web/web_test.go

analysis/tokenizer/whitespace

analysis/tokenizer/whitespace/whitespace.go

analysis/tokenizer/whitespace/whitespace_test.go

analysis/tokenmap

analysis/tokenmap.go

analysis/tokenmap/custom.go

analysis/tokenmap_test.go

analysis/type.go

analysis/util.go

analysis/util_test.go

cmd/bleve

cmd/bleve/cmd

cmd/bleve/cmd/bulk.go

cmd/bleve/cmd/check.go

cmd/bleve/cmd/count.go

cmd/bleve/cmd/create.go

cmd/bleve/cmd/dictionary.go

cmd/bleve/cmd/dump.go

cmd/bleve/cmd/dumpDoc.go

cmd/bleve/cmd/dumpFields.go

cmd/bleve/cmd/fields.go

cmd/bleve/cmd/index.go

cmd/bleve/cmd/mapping.go

cmd/bleve/cmd/query.go

cmd/bleve/cmd/registry.go

cmd/bleve/cmd/root.go

cmd/bleve/gendocs.go

cmd/bleve/main.go

config

config.go

config/README.md

config/config.go

config/config_cld2.go

config/config_cznicb.go

config/config_forestdb.go

config/config_icu.go

config/config_kagome.go

config/config_leveldb.go

config/config_libstemmer.go

config/config_rocksdb.go

config_app.go

config_disk.go

doc.go

docs

docs/bleve.png

docs/build_children.sh

docs/merge-coverprofile.go

docs/old_build_script.txt

docs/project-code-coverage.sh

document

document/document.go

document/document_test.go

document/field.go

document/field_boolean.go

document/field_composite.go

document/field_datetime.go

document/field_numeric.go

document/field_numeric_test.go

document/field_text.go

document/indexing_options.go

document/indexing_options_test.go

error.go

examples_test.go

http

http/alias.go

http/debug.go

http/doc_count.go

http/doc_delete.go

http/doc_get.go

http/doc_index.go

http/fields.go

http/handlers_test.go

http/index_create.go

http/index_delete.go

http/index_get.go

http/index_list.go

http/registry.go

http/search.go

http/util.go

index

index.go

index/analysis.go

index/field_cache.go

index/index.go

index/store

index/store/batch.go

index/store/boltdb

index/store/boltdb/iterator.go

index/store/boltdb/reader.go

index/store/boltdb/stats.go

index/store/boltdb/store.go

index/store/boltdb/store_test.go

index/store/boltdb/writer.go

index/store/goleveldb

index/store/goleveldb/batch.go

index/store/goleveldb/config.go

index/store/goleveldb/iterator.go

index/store/goleveldb/reader.go

index/store/goleveldb/store.go

index/store/goleveldb/store_test.go

index/store/goleveldb/writer.go

index/store/gtreap

index/store/gtreap/iterator.go

index/store/gtreap/reader.go

index/store/gtreap/store.go

index/store/gtreap/store_test.go

index/store/gtreap/writer.go

index/store/kvstore.go

index/store/merge.go

index/store/metrics

index/store/metrics/batch.go

index/store/metrics/iterator.go

index/store/metrics/metrics_test.go

index/store/metrics/reader.go

index/store/metrics/stats.go

index/store/metrics/store.go

index/store/metrics/store_test.go

index/store/metrics/util.go

index/store/metrics/writer.go

index/store/moss

index/store/moss/batch.go

index/store/moss/iterator.go

index/store/moss/lower.go

index/store/moss/lower_test.go

index/store/moss/reader.go

index/store/moss/stats.go

index/store/moss/store.go

index/store/moss/store_test.go

index/store/moss/writer.go

index/store/multiget.go

index/store/null

index/store/null/null.go

index/store/null/null_test.go

index/store/test

index/store/test/README.md

index/store/test/bytes.go

index/store/test/crud.go

index/store/test/isolation.go

index/store/test/iterator.go

index/store/test/merge.go

index/upsidedown

index/upsidedown/analysis.go

index/upsidedown/analysis_test.go

index/upsidedown/benchmark_all.sh

index/upsidedown/benchmark_boltdb_test.go

index/upsidedown/benchmark_common_test.go

index/upsidedown/benchmark_cznicb_test.go

index/upsidedown/benchmark_forestdb_test.go

index/upsidedown/benchmark_goleveldb_test.go

index/upsidedown/benchmark_gorocksdb_test.go

index/upsidedown/benchmark_gtreap_test.go

index/upsidedown/benchmark_leveldb_test.go

index/upsidedown/benchmark_null_test.go

index/upsidedown/dump.go

index/upsidedown/dump_test.go

index/upsidedown/field_dict.go

index/upsidedown/field_dict_test.go

index/upsidedown/index_reader.go

index/upsidedown/reader.go

index/upsidedown/reader_test.go

index/upsidedown/row.go

index/upsidedown/row_merge.go

index/upsidedown/row_merge_test.go

index/upsidedown/row_test.go

index/upsidedown/stats.go

index/upsidedown/upsidedown.go

index/upsidedown/upsidedown.pb.go

index/upsidedown/upsidedown.proto

index/upsidedown/upsidedown_test.go

index_alias.go

index_alias_impl.go

index_alias_impl_test.go

index_impl.go

index_meta.go

index_meta_test.go

index_stats.go

index_test.go

mapping

mapping.go

mapping/analysis.go

mapping/document.go

mapping/examples_test.go

mapping/field.go

mapping/index.go

mapping/mapping.go

mapping/mapping_test.go

mapping/reflect.go

mapping/reflect_test.go

numeric

numeric/float.go

numeric/float_test.go

numeric/prefix_coded.go

numeric/prefix_coded_test.go

query.go

registry

registry/analyzer.go

registry/cache.go

registry/char_filter.go

registry/datetime_parser.go

registry/fragment_formatter.go

registry/fragmenter.go

registry/highlighter.go

registry/index_type.go

registry/registry.go

registry/store.go

registry/token_filter.go

registry/token_maps.go

registry/tokenizer.go

search.go

search/collector

search/collector.go

search/collector/bench_test.go

search/collector/heap.go

search/collector/list.go

search/collector/search_test.go

search/collector/slice.go

search/collector/topn.go

search/collector/topn_test.go

search/explanation.go

search/facet

search/facet/benchmark_data.txt

search/facet/facet_builder_datetime.go

search/facet/facet_builder_numeric.go

search/facet/facet_builder_numeric_test.go

search/facet/facet_builder_terms.go

search/facet/facet_builder_terms_test.go

search/facets_builder.go

search/facets_builder_test.go

search/highlight

search/highlight/format

search/highlight/format/ansi

search/highlight/format/ansi/ansi.go

search/highlight/format/html

search/highlight/format/html/html.go

search/highlight/format/html/html_test.go

search/highlight/fragmenter

search/highlight/fragmenter/simple

search/highlight/fragmenter/simple/simple.go

search/highlight/fragmenter/simple/simple_test.go

search/highlight/highlighter

search/highlight/highlighter.go

search/highlight/highlighter/ansi

search/highlight/highlighter/ansi/ansi.go

search/highlight/highlighter/html

search/highlight/highlighter/html/html.go

search/highlight/highlighter/simple

search/highlight/highlighter/simple/fragment_scorer_simple.go

search/highlight/highlighter/simple/fragment_scorer_simple_test.go

search/highlight/highlighter/simple/highlighter_simple.go

search/highlight/highlighter/simple/highlighter_simple_test.go

search/highlight/term_locations.go

search/highlight/term_locations_test.go

search/levenshtein.go

search/levenshtein_test.go

search/pool.go

search/pool_test.go

search/query

search/query/bool_field.go

search/query/boolean.go

search/query/boost.go

search/query/conjunction.go

search/query/date_range.go

search/query/date_range_test.go

search/query/disjunction.go

search/query/docid.go

search/query/fuzzy.go

search/query/match.go

search/query/match_all.go

search/query/match_none.go

search/query/match_phrase.go

search/query/match_phrase_test.go

search/query/multi_phrase.go

search/query/numeric_range.go

search/query/phrase.go

search/query/prefix.go

search/query/query.go

search/query/query_string.go

search/query/query_string.y

search/query/query_string.y.go

search/query/query_string_lex.go

search/query/query_string_parser.go

search/query/query_string_parser_test.go

search/query/query_test.go

search/query/regexp.go

search/query/term.go

search/query/wildcard.go

search/scorer

search/scorer/scorer_conjunction.go

search/scorer/scorer_constant.go

search/scorer/scorer_constant_test.go

search/scorer/scorer_disjunction.go

search/scorer/scorer_term.go

search/scorer/scorer_term_test.go

search/scorer/sqrt_cache.go

search/search.go

search/searcher

search/searcher/base_test.go

search/searcher/ordered_searchers_list.go

search/searcher/search_boolean.go

search/searcher/search_boolean_test.go

search/searcher/search_conjunction.go

search/searcher/search_conjunction_test.go

search/searcher/search_disjunction.go

search/searcher/search_disjunction_test.go

search/searcher/search_docid.go

search/searcher/search_docid_test.go

search/searcher/search_fuzzy.go

search/searcher/search_fuzzy_test.go

search/searcher/search_match_all.go

search/searcher/search_match_all_test.go

search/searcher/search_match_none.go

search/searcher/search_match_none_test.go

search/searcher/search_numeric_range.go

search/searcher/search_numeric_range_test.go

search/searcher/search_phrase.go

search/searcher/search_phrase_test.go

search/searcher/search_regexp.go

search/searcher/search_regexp_test.go

search/searcher/search_term.go

search/searcher/search_term_prefix.go

search/searcher/search_term_test.go

search/sort.go

search/util.go

search/util_test.go

search_test.go

test

test/integration.go

test/integration_test.go

test/tests

test/tests/basic

test/tests/basic/data

test/tests/basic/data/a.json

test/tests/basic/data/b.json

test/tests/basic/data/c.json

test/tests/basic/data/d.json

test/tests/basic/mapping.json

test/tests/basic/searches.json

test/tests/employee

test/tests/employee/data

test/tests/employee/data/emp10508560.json

test/tests/employee/mapping.json

test/tests/employee/searches.json

test/tests/facet

test/tests/facet/data

test/tests/facet/data/a.json

test/tests/facet/data/b.json

test/tests/facet/data/c.json

test/tests/facet/data/d.json

test/tests/facet/data/e.json

test/tests/facet/data/f.json

test/tests/facet/data/g.json

test/tests/facet/data/h.json

test/tests/facet/data/i.json

test/tests/facet/data/j.json

test/tests/facet/mapping.json

test/tests/facet/searches.json

test/tests/fosdem

test/tests/fosdem/data

test/tests/fosdem/data/3311@FOSDEM15@fosdem.org.json

test/tests/fosdem/data/3492@FOSDEM15@fosdem.org.json

test/tests/fosdem/data/3496@FOSDEM15@fosdem.org.json

test/tests/fosdem/data/3505@FOSDEM15@fosdem.org.json

test/tests/fosdem/data/3507@FOSDEM15@fosdem.org.json

test/tests/fosdem/mapping.json

test/tests/fosdem/searches.json

test/tests/phrase

test/tests/phrase/data

test/tests/phrase/data/a.json

test/tests/phrase/data/b.json

test/tests/phrase/mapping.json

test/tests/phrase/searches.json

test/tests/sort

test/tests/sort/data

test/tests/sort/data/a.json

test/tests/sort/data/b.json

test/tests/sort/data/c.json

test/tests/sort/data/d.json

test/tests/sort/data/e.json

test/tests/sort/data/f.json

test/tests/sort/mapping.json

test/tests/sort/searches.json

Show diffs side-by-side

added added

removed removed

analysis/token/camelcase/camelcase.go

// Licensed under the Apache License, Version 2.0 (the "License");

// you may not use this file except in compliance with the License.

// You may obtain a copy of the License at

// http://www.apache.org/licenses/LICENSE-2.0

// Unless required by applicable law or agreed to in writing, software

// distributed under the License is distributed on an "AS IS" BASIS,

// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.

// See the License for the specific language governing permissions and

// limitations under the License.

package camelcase

import (

"bytes"

"unicode/utf8"

"github.com/blevesearch/bleve/analysis"

"github.com/blevesearch/bleve/registry"

)

// Name is the identifier under which this package's token filter
// constructor is registered with the registry (see init).
const Name = "camelCase"

// CamelCaseFilter splits a given token into a set of tokens where each
// resulting token falls into one of the following classes:
//
//  1. Upper case followed by lower case letters.
//     Terminated by a number, an upper case letter, or a non alpha-numeric symbol.
//  2. Upper case followed by upper case letters.
//     Terminated by a number, an upper case followed by a lower case letter,
//     or a non alpha-numeric symbol.
//  3. Lower case followed by lower case letters.
//     Terminated by a number, an upper case letter, or a non alpha-numeric symbol.
//  4. Number followed by numbers.
//     Terminated by a letter or a non alpha-numeric symbol.
//  5. Non alpha-numeric symbol followed by non alpha-numeric symbols.
//     Terminated by a number or a letter.
//
// It does a one-time sequential pass over an input token, from left to right.
// The scan is greedy and generates the longest substring that fits into one
// of the classes.
//
// See the test file for examples of classes and their parsings.
//
// The type has no fields.
type CamelCaseFilter struct{}

// NewCamelCaseFilter returns a pointer to a freshly allocated
// CamelCaseFilter. The filter has no fields, so no configuration is needed.
func NewCamelCaseFilter() *CamelCaseFilter {
	return new(CamelCaseFilter)
}

func (f *CamelCaseFilter) Filter(input analysis.TokenStream) analysis.TokenStream {

rv := make(analysis.TokenStream, 0, len(input))

for _, token := range input {

runeCount := utf8.RuneCount(token.Term)

runes := bytes.Runes(token.Term)

p := NewParser(runeCount)

for i := 0; i < runeCount; i++ {

if i+1 >= runeCount {

p.Push(runes[i], nil)

} else {

p.Push(runes[i], &runes[i+1])

}

rv = append(rv, p.FlushTokens()...)

}

return rv

}

// CamelCaseFilterConstructor builds a CamelCaseFilter for the registry.
//
// Neither config nor cache is consulted: the filter takes no options. The
// returned error is always nil.
func CamelCaseFilterConstructor(config map[string]interface{}, cache *registry.Cache) (analysis.TokenFilter, error) {
	filter := NewCamelCaseFilter()
	return filter, nil
}

// init registers CamelCaseFilterConstructor with the registry under Name
// when the package is initialized.
func init() {
	registry.RegisterTokenFilter(Name, CamelCaseFilterConstructor)
}

Older »