![Marty Schoch](/assets/img/avatar_default.png)
this improvement was started to improve code coverage but also improves performance and adds support for escaping escaping: The following quoted string enumerates the characters which may be escaped. "+-=&|><!(){}[]^\"~*?:\\/ " Note that this list includes space. In order to escape these characters, they are prefixed with the \ (backslash) character. In all cases, using the escaped version produces the character itself and is not interpretted by the lexer. Two simple examples: my\ name Will be interpretted as a single argument to a match query with the value "my name". "contains a\" character" Will be interpretted as a single argument to a phrase query with the value `contains a " character`. Performance: before$ go test -v -run=xxx -bench=BenchmarkLexer BenchmarkLexer-4 100000 13991 ns/op PASS ok github.com/blevesearch/bleve 1.570s after$ go test -v -run=xxx -bench=BenchmarkLexer BenchmarkLexer-4 500000 3387 ns/op PASS ok github.com/blevesearch/bleve 1.740s
70 lines
1.6 KiB
Go
70 lines
1.6 KiB
Go
// Copyright (c) 2014 Couchbase, Inc.
|
|
// Licensed under the Apache License, Version 2.0 (the "License"); you may not use this file
|
|
// except in compliance with the License. You may obtain a copy of the License at
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
// Unless required by applicable law or agreed to in writing, software distributed under the
|
|
// License is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND,
|
|
// either express or implied. See the License for the specific language governing permissions
|
|
// and limitations under the License.
|
|
|
|
//go:generate go tool yacc -o query_string.y.go query_string.y
|
|
//go:generate sed -i "" -e 1d query_string.y.go
|
|
|
|
package bleve
|
|
|
|
import (
|
|
"fmt"
|
|
"strings"
|
|
)
|
|
|
|
var debugParser bool
|
|
var debugLexer bool
|
|
|
|
func parseQuerySyntax(query string) (rq Query, err error) {
|
|
lex := newLexerWrapper(newQueryStringLex(strings.NewReader(query)))
|
|
doParse(lex)
|
|
|
|
if len(lex.errs) > 0 {
|
|
return nil, fmt.Errorf(strings.Join(lex.errs, "\n"))
|
|
}
|
|
return lex.query, nil
|
|
}
|
|
|
|
func doParse(lex *lexerWrapper) {
|
|
defer func() {
|
|
r := recover()
|
|
if r != nil {
|
|
lex.errs = append(lex.errs, fmt.Sprintf("parse error: %v", r))
|
|
}
|
|
}()
|
|
|
|
yyParse(lex)
|
|
}
|
|
|
|
const (
|
|
queryShould = iota
|
|
queryMust
|
|
queryMustNot
|
|
)
|
|
|
|
type lexerWrapper struct {
|
|
lex yyLexer
|
|
errs []string
|
|
query *booleanQuery
|
|
}
|
|
|
|
func newLexerWrapper(lex yyLexer) *lexerWrapper {
|
|
return &lexerWrapper{
|
|
lex: lex,
|
|
query: NewBooleanQuery(nil, nil, nil),
|
|
}
|
|
}
|
|
|
|
func (l *lexerWrapper) Lex(lval *yySymType) int {
|
|
return l.lex.Lex(lval)
|
|
}
|
|
|
|
func (l *lexerWrapper) Error(s string) {
|
|
l.errs = append(l.errs, s)
|
|
}
|