0
0

move elision filter after lowercase filter

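This affects every language that uses the elision filter: running it
before lowercasing meant capitalized elided articles were not stripped
(e.g. "Nell'anfora" should analyze to "anfor").
The fr and it analyzers are updated now.
The ca and ga languages are still missing other components and
do not yet have an analyzer, but they should use the same filter order
once they are ready.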

fixes #218
This commit is contained in:
Marty Schoch 2015-07-21 10:43:53 -04:00
parent 2a8f319689
commit 1f4ef3da8b
3 changed files with 11 additions and 2 deletions

View File

@@ -43,8 +43,8 @@ func AnalyzerConstructor(config map[string]interface{}, cache *registry.Cache) (
rv := analysis.Analyzer{
Tokenizer: tokenizer,
TokenFilters: []analysis.TokenFilter{
-elisionFilter,
toLowerFilter,
+elisionFilter,
stopFrFilter,
stemmerFrFilter,
},

View File

@@ -43,8 +43,8 @@ func AnalyzerConstructor(config map[string]interface{}, cache *registry.Cache) (
rv := analysis.Analyzer{
Tokenizer: tokenizer,
TokenFilters: []analysis.TokenFilter{
-elisionFilter,
toLowerFilter,
+elisionFilter,
stopItFilter,
stemmerItFilter,
},

View File

@@ -61,6 +61,15 @@ func TestItalianAnalyzer(t *testing.T) {
},
},
},
+// test for bug #218
+{
+input: []byte("Nell'anfora"),
+output: analysis.TokenStream{
+&analysis.Token{
+Term: []byte("anfor"),
+},
+},
+},
}
cache := registry.NewCache()