2014-04-24 18:24:19 +02:00
|
|
|
// Copyright (c) 2014 Couchbase, Inc.
|
2016-10-02 16:13:14 +02:00
|
|
|
//
|
|
|
|
// Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
// you may not use this file except in compliance with the License.
|
|
|
|
// You may obtain a copy of the License at
|
|
|
|
//
|
|
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
//
|
|
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
|
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
// See the License for the specific language governing permissions and
|
|
|
|
// limitations under the License.
|
2014-09-02 16:54:50 +02:00
|
|
|
|
2016-10-02 16:29:39 +02:00
|
|
|
package searcher
|
2014-04-24 18:24:19 +02:00
|
|
|
|
|
|
|
import (
|
2014-06-26 17:43:13 +02:00
|
|
|
"math"
|
2014-07-30 18:30:38 +02:00
|
|
|
"regexp"
|
2014-06-26 17:43:13 +02:00
|
|
|
|
2014-08-28 21:38:57 +02:00
|
|
|
"github.com/blevesearch/bleve/analysis"
|
2016-10-01 23:20:59 +02:00
|
|
|
regexpTokenizer "github.com/blevesearch/bleve/analysis/tokenizer/regexp"
|
2014-08-28 21:38:57 +02:00
|
|
|
"github.com/blevesearch/bleve/document"
|
|
|
|
"github.com/blevesearch/bleve/index"
|
2015-09-23 20:25:47 +02:00
|
|
|
"github.com/blevesearch/bleve/index/store/gtreap"
|
2016-09-30 17:30:17 +02:00
|
|
|
"github.com/blevesearch/bleve/index/upsidedown"
|
2014-04-24 18:24:19 +02:00
|
|
|
)
|
|
|
|
|
2014-06-26 17:43:13 +02:00
|
|
|
var twoDocIndex index.Index //= upside_down.NewUpsideDownCouch(inmem.MustOpen())
|
|
|
|
|
|
|
|
func init() {
|
2015-09-02 19:12:08 +02:00
|
|
|
analysisQueue := index.NewAnalysisQueue(1)
|
2015-09-23 20:25:47 +02:00
|
|
|
var err error
|
2016-09-30 17:30:17 +02:00
|
|
|
twoDocIndex, err = upsidedown.NewUpsideDownCouch(
|
BREAKING CHANGE - new method to create memory only index
Previously bleve allowed you to create a memory-only index by
simply passing "" as the path argument to the New() method.
This was not clear when reading the code, and led to some
problematic error cases as well.
Now, to create a memory-only index one should use the
NewMemOnly() method. Passing "" as the path argument
to the New() method will now return os.ErrInvalid.
Advanced users calling NewUsing() can create disk-based or
memory-only indexes, but the change here is that pass ""
as the path argument no longer defaults you into getting
a memory-only index. Instead, the KV store is selected
manually, just as it is for the disk-based solutions.
Here is an example use of the NewUsing() method to create
a memory-only index:
NewUsing("", indexMapping, Config.DefaultIndexType,
Config.DefaultMemKVStore, nil)
Config.DefaultMemKVStore is just a new default value
added to the configuration, it currently points to
gtreap.Name (which could have been used directly
instead for more control)
closes #427
2016-09-27 20:05:55 +02:00
|
|
|
gtreap.Name,
|
|
|
|
map[string]interface{}{
|
|
|
|
"path": "",
|
|
|
|
}, analysisQueue)
|
2015-09-23 20:25:47 +02:00
|
|
|
if err != nil {
|
|
|
|
panic(err)
|
|
|
|
}
|
|
|
|
err = twoDocIndex.Open()
|
2015-04-24 23:11:47 +02:00
|
|
|
if err != nil {
|
|
|
|
panic(err)
|
|
|
|
}
|
2014-06-26 17:43:13 +02:00
|
|
|
for _, doc := range twoDocIndexDocs {
|
2015-04-07 20:59:35 +02:00
|
|
|
err := twoDocIndex.Update(doc)
|
|
|
|
if err != nil {
|
|
|
|
panic(err)
|
|
|
|
}
|
2014-06-26 17:43:13 +02:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2014-07-30 18:30:38 +02:00
|
|
|
// create a simpler analyzer which will support these tests
|
|
|
|
var testAnalyzer = &analysis.Analyzer{
|
2016-09-30 17:18:39 +02:00
|
|
|
Tokenizer: regexpTokenizer.NewRegexpTokenizer(regexp.MustCompile(`\w+`)),
|
2014-07-30 18:30:38 +02:00
|
|
|
}
|
|
|
|
|
2014-04-24 18:24:19 +02:00
|
|
|
// sets up some mock data used in many tests in this package
|
2014-09-03 19:02:10 +02:00
|
|
|
var twoDocIndexDescIndexingOptions = document.DefaultTextIndexingOptions | document.IncludeTermVectors
|
2014-04-24 18:24:19 +02:00
|
|
|
|
|
|
|
var twoDocIndexDocs = []*document.Document{
|
|
|
|
// must have 4/4 beer
|
|
|
|
document.NewDocument("1").
|
2014-08-19 14:58:26 +02:00
|
|
|
AddField(document.NewTextField("name", []uint64{}, []byte("marty"))).
|
|
|
|
AddField(document.NewTextFieldCustom("desc", []uint64{}, []byte("beer beer beer beer"), twoDocIndexDescIndexingOptions, testAnalyzer)).
|
|
|
|
AddField(document.NewTextFieldWithAnalyzer("street", []uint64{}, []byte("couchbase way"), testAnalyzer)),
|
2014-04-24 18:24:19 +02:00
|
|
|
// must have 1/4 beer
|
|
|
|
document.NewDocument("2").
|
2014-08-19 14:58:26 +02:00
|
|
|
AddField(document.NewTextField("name", []uint64{}, []byte("steve"))).
|
|
|
|
AddField(document.NewTextFieldCustom("desc", []uint64{}, []byte("angst beer couch database"), twoDocIndexDescIndexingOptions, testAnalyzer)).
|
|
|
|
AddField(document.NewTextFieldWithAnalyzer("street", []uint64{}, []byte("couchbase way"), testAnalyzer)).
|
|
|
|
AddField(document.NewTextFieldWithAnalyzer("title", []uint64{}, []byte("mister"), testAnalyzer)),
|
2014-04-24 18:24:19 +02:00
|
|
|
// must have 1/4 beer
|
|
|
|
document.NewDocument("3").
|
2014-08-19 14:58:26 +02:00
|
|
|
AddField(document.NewTextField("name", []uint64{}, []byte("dustin"))).
|
|
|
|
AddField(document.NewTextFieldCustom("desc", []uint64{}, []byte("apple beer column dank"), twoDocIndexDescIndexingOptions, testAnalyzer)).
|
|
|
|
AddField(document.NewTextFieldWithAnalyzer("title", []uint64{}, []byte("mister"), testAnalyzer)),
|
2014-04-24 18:24:19 +02:00
|
|
|
// must have 65/65 beer
|
|
|
|
document.NewDocument("4").
|
2014-08-19 14:58:26 +02:00
|
|
|
AddField(document.NewTextField("name", []uint64{}, []byte("ravi"))).
|
|
|
|
AddField(document.NewTextFieldCustom("desc", []uint64{}, []byte("beer beer beer beer beer beer beer beer beer beer beer beer beer beer beer beer beer beer beer beer beer beer beer beer beer beer beer beer beer beer beer beer beer beer beer beer beer beer beer beer beer beer beer beer beer beer beer beer beer beer beer beer beer beer beer beer beer beer beer beer beer beer beer beer beer"), twoDocIndexDescIndexingOptions, testAnalyzer)),
|
2014-04-24 18:24:19 +02:00
|
|
|
// must have 0/x beer
|
|
|
|
document.NewDocument("5").
|
2014-08-19 14:58:26 +02:00
|
|
|
AddField(document.NewTextField("name", []uint64{}, []byte("bobert"))).
|
|
|
|
AddField(document.NewTextFieldCustom("desc", []uint64{}, []byte("water"), twoDocIndexDescIndexingOptions, testAnalyzer)).
|
|
|
|
AddField(document.NewTextFieldWithAnalyzer("title", []uint64{}, []byte("mister"), testAnalyzer)),
|
2014-04-24 18:24:19 +02:00
|
|
|
}
|
|
|
|
|
2014-06-26 17:43:13 +02:00
|
|
|
func scoresCloseEnough(a, b float64) bool {
|
|
|
|
return math.Abs(a-b) < 0.001
|
|
|
|
}
|