move elision filter after lowercase filter
This affects all languages using the elision filter. Languages fr and it are updated now. Languages ca and ga are still missing other components and do not yet have an analyzer, but they should follow this lead once they are ready. Fixes #218.
This commit is contained in:
parent
2a8f319689
commit
1f4ef3da8b
|
@ -43,8 +43,8 @@ func AnalyzerConstructor(config map[string]interface{}, cache *registry.Cache) (
|
|||
rv := analysis.Analyzer{
|
||||
Tokenizer: tokenizer,
|
||||
TokenFilters: []analysis.TokenFilter{
|
||||
elisionFilter,
|
||||
toLowerFilter,
|
||||
elisionFilter,
|
||||
stopFrFilter,
|
||||
stemmerFrFilter,
|
||||
},
|
||||
|
|
|
@ -43,8 +43,8 @@ func AnalyzerConstructor(config map[string]interface{}, cache *registry.Cache) (
|
|||
rv := analysis.Analyzer{
|
||||
Tokenizer: tokenizer,
|
||||
TokenFilters: []analysis.TokenFilter{
|
||||
elisionFilter,
|
||||
toLowerFilter,
|
||||
elisionFilter,
|
||||
stopItFilter,
|
||||
stemmerItFilter,
|
||||
},
|
||||
|
|
|
@ -61,6 +61,15 @@ func TestItalianAnalyzer(t *testing.T) {
|
|||
},
|
||||
},
|
||||
},
|
||||
// test for bug #218
|
||||
{
|
||||
input: []byte("Nell'anfora"),
|
||||
output: analysis.TokenStream{
|
||||
&analysis.Token{
|
||||
Term: []byte("anfor"),
|
||||
},
|
||||
},
|
||||
},
|
||||
}
|
||||
|
||||
cache := registry.NewCache()
|
||||
|
|
Loading…
Reference in New Issue
Block a user