// Copyright (c) 2014 Couchbase, Inc.
// Licensed under the Apache License, Version 2.0 (the "License"); you may not use this file
// except in compliance with the License. You may obtain a copy of the License at
// http://www.apache.org/licenses/LICENSE-2.0
// Unless required by applicable law or agreed to in writing, software distributed under the
// License is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND,
// either express or implied. See the License for the specific language governing permissions
// and limitations under the License.
2014-09-02 16:54:50 +02:00
|
|
|
|
2014-04-17 22:55:53 +02:00
|
|
|
package upside_down
|
|
|
|
|
|
|
|
import (
|
|
|
|
"os"
|
|
|
|
"reflect"
|
|
|
|
"testing"
|
|
|
|
|
2014-08-28 21:38:57 +02:00
|
|
|
"github.com/blevesearch/bleve/document"
|
|
|
|
"github.com/blevesearch/bleve/index"
|
2014-09-02 19:56:35 +02:00
|
|
|
"github.com/blevesearch/bleve/index/store/boltdb"
|
2014-04-17 22:55:53 +02:00
|
|
|
)
|
|
|
|
|
|
|
|
func TestIndexReader(t *testing.T) {
|
|
|
|
defer os.RemoveAll("test")
|
|
|
|
|
2014-09-02 19:56:35 +02:00
|
|
|
store, err := boltdb.Open("test", "bleve")
|
2014-09-24 14:13:14 +02:00
|
|
|
analysisQueue := NewAnalysisQueue(1)
|
|
|
|
idx := NewUpsideDownCouch(store, analysisQueue)
|
2014-05-09 22:37:04 +02:00
|
|
|
err = idx.Open()
|
2014-04-17 22:55:53 +02:00
|
|
|
if err != nil {
|
|
|
|
t.Errorf("error opening index: %v", err)
|
|
|
|
}
|
|
|
|
defer idx.Close()
|
|
|
|
|
2014-09-04 00:47:02 +02:00
|
|
|
var expectedCount uint64
|
2014-04-17 22:55:53 +02:00
|
|
|
doc := document.NewDocument("1")
|
2014-08-19 14:58:26 +02:00
|
|
|
doc.AddField(document.NewTextField("name", []uint64{}, []byte("test")))
|
2014-04-17 22:55:53 +02:00
|
|
|
err = idx.Update(doc)
|
|
|
|
if err != nil {
|
|
|
|
t.Errorf("Error updating index: %v", err)
|
|
|
|
}
|
2014-09-04 00:47:02 +02:00
|
|
|
expectedCount++
|
2014-04-17 22:55:53 +02:00
|
|
|
|
|
|
|
doc = document.NewDocument("2")
|
2014-08-19 14:58:26 +02:00
|
|
|
doc.AddField(document.NewTextFieldWithAnalyzer("name", []uint64{}, []byte("test test test"), testAnalyzer))
|
2014-09-03 19:02:10 +02:00
|
|
|
doc.AddField(document.NewTextFieldCustom("desc", []uint64{}, []byte("eat more rice"), document.IndexField|document.IncludeTermVectors, testAnalyzer))
|
2014-04-17 22:55:53 +02:00
|
|
|
err = idx.Update(doc)
|
|
|
|
if err != nil {
|
|
|
|
t.Errorf("Error updating index: %v", err)
|
|
|
|
}
|
2014-09-04 00:47:02 +02:00
|
|
|
expectedCount++
|
2014-04-17 22:55:53 +02:00
|
|
|
|
2014-10-31 14:40:23 +01:00
|
|
|
indexReader, err := idx.Reader()
|
|
|
|
if err != nil {
|
|
|
|
t.Error(err)
|
|
|
|
}
|
2014-09-12 23:21:35 +02:00
|
|
|
defer indexReader.Close()
|
|
|
|
|
2014-12-18 18:43:12 +01:00
|
|
|
// first look for a term that doesn't exist
|
2014-09-12 23:21:35 +02:00
|
|
|
reader, err := indexReader.TermFieldReader([]byte("nope"), "name")
|
2014-04-17 22:55:53 +02:00
|
|
|
if err != nil {
|
|
|
|
t.Errorf("Error accessing term field reader: %v", err)
|
|
|
|
}
|
|
|
|
count := reader.Count()
|
|
|
|
if count != 0 {
|
|
|
|
t.Errorf("Expected doc count to be: %d got: %d", 0, count)
|
|
|
|
}
|
|
|
|
reader.Close()
|
|
|
|
|
2014-09-12 23:21:35 +02:00
|
|
|
reader, err = indexReader.TermFieldReader([]byte("test"), "name")
|
2014-04-17 22:55:53 +02:00
|
|
|
if err != nil {
|
|
|
|
t.Errorf("Error accessing term field reader: %v", err)
|
|
|
|
}
|
|
|
|
|
|
|
|
expectedCount = 2
|
|
|
|
count = reader.Count()
|
|
|
|
if count != expectedCount {
|
|
|
|
t.Errorf("Exptected doc count to be: %d got: %d", expectedCount, count)
|
|
|
|
}
|
|
|
|
|
|
|
|
var match *index.TermFieldDoc
|
|
|
|
var actualCount uint64
|
|
|
|
match, err = reader.Next()
|
|
|
|
for err == nil && match != nil {
|
|
|
|
match, err = reader.Next()
|
|
|
|
if err != nil {
|
|
|
|
t.Errorf("unexpected error reading next")
|
|
|
|
}
|
2014-09-04 00:47:02 +02:00
|
|
|
actualCount++
|
2014-04-17 22:55:53 +02:00
|
|
|
}
|
|
|
|
if actualCount != count {
|
|
|
|
t.Errorf("count was 2, but only saw %d", actualCount)
|
|
|
|
}
|
|
|
|
|
|
|
|
expectedMatch := &index.TermFieldDoc{
|
|
|
|
ID: "2",
|
|
|
|
Freq: 1,
|
|
|
|
Norm: 0.5773502588272095,
|
|
|
|
Vectors: []*index.TermFieldVector{
|
|
|
|
&index.TermFieldVector{
|
|
|
|
Field: "desc",
|
|
|
|
Pos: 3,
|
|
|
|
Start: 9,
|
|
|
|
End: 13,
|
|
|
|
},
|
|
|
|
},
|
|
|
|
}
|
2014-09-12 23:21:35 +02:00
|
|
|
tfr, err := indexReader.TermFieldReader([]byte("rice"), "desc")
|
2014-04-17 22:55:53 +02:00
|
|
|
if err != nil {
|
|
|
|
t.Errorf("unexpected error: %v", err)
|
|
|
|
}
|
|
|
|
match, err = tfr.Next()
|
|
|
|
if err != nil {
|
|
|
|
t.Errorf("unexpected error: %v", err)
|
|
|
|
}
|
|
|
|
if !reflect.DeepEqual(expectedMatch, match) {
|
|
|
|
t.Errorf("got %#v, expected %#v", match, expectedMatch)
|
|
|
|
}
|
2014-04-20 15:43:02 +02:00
|
|
|
reader.Close()
|
|
|
|
|
|
|
|
// now test usage of advance
|
2014-09-12 23:21:35 +02:00
|
|
|
reader, err = indexReader.TermFieldReader([]byte("test"), "name")
|
2014-04-20 15:43:02 +02:00
|
|
|
if err != nil {
|
|
|
|
t.Errorf("Error accessing term field reader: %v", err)
|
|
|
|
}
|
|
|
|
|
|
|
|
match, err = reader.Advance("2")
|
|
|
|
if err != nil {
|
|
|
|
t.Errorf("unexpected error: %v", err)
|
|
|
|
}
|
2014-05-09 22:37:04 +02:00
|
|
|
if match == nil {
|
|
|
|
t.Fatalf("Expected match, got nil")
|
|
|
|
}
|
2014-04-20 15:43:02 +02:00
|
|
|
if match.ID != "2" {
|
|
|
|
t.Errorf("Expected ID '2', got '%s'", match.ID)
|
|
|
|
}
|
|
|
|
match, err = reader.Advance("3")
|
|
|
|
if err != nil {
|
|
|
|
t.Errorf("unexpected error: %v", err)
|
|
|
|
}
|
|
|
|
if match != nil {
|
|
|
|
t.Errorf("expected nil, got %v", match)
|
|
|
|
}
|
|
|
|
reader.Close()
|
|
|
|
|
2014-04-22 19:57:13 +02:00
|
|
|
// now test creating a reader for a field that doesn't exist
|
2014-09-12 23:21:35 +02:00
|
|
|
reader, err = indexReader.TermFieldReader([]byte("water"), "doesnotexist")
|
2014-04-22 19:57:13 +02:00
|
|
|
if err != nil {
|
|
|
|
t.Errorf("Error accessing term field reader: %v", err)
|
|
|
|
}
|
|
|
|
count = reader.Count()
|
|
|
|
if count != 0 {
|
|
|
|
t.Errorf("expected count 0 for reader of non-existant field")
|
|
|
|
}
|
|
|
|
match, err = reader.Next()
|
|
|
|
if err != nil {
|
|
|
|
t.Errorf("unexpected error: %v", err)
|
|
|
|
}
|
|
|
|
if match != nil {
|
|
|
|
t.Errorf("expected nil, got %v", match)
|
|
|
|
}
|
|
|
|
match, err = reader.Advance("anywhere")
|
|
|
|
if err != nil {
|
|
|
|
t.Errorf("unexpected error: %v", err)
|
|
|
|
}
|
|
|
|
if match != nil {
|
|
|
|
t.Errorf("expected nil, got %v", match)
|
|
|
|
}
|
|
|
|
|
2014-04-17 22:55:53 +02:00
|
|
|
}
|
2014-07-11 20:24:28 +02:00
|
|
|
|
|
|
|
func TestIndexDocIdReader(t *testing.T) {
|
|
|
|
defer os.RemoveAll("test")
|
|
|
|
|
2014-09-02 19:56:35 +02:00
|
|
|
store, err := boltdb.Open("test", "bleve")
|
2014-09-24 14:13:14 +02:00
|
|
|
analysisQueue := NewAnalysisQueue(1)
|
|
|
|
idx := NewUpsideDownCouch(store, analysisQueue)
|
2014-07-11 20:24:28 +02:00
|
|
|
err = idx.Open()
|
|
|
|
if err != nil {
|
|
|
|
t.Errorf("error opening index: %v", err)
|
|
|
|
}
|
|
|
|
defer idx.Close()
|
|
|
|
|
2014-09-04 00:47:02 +02:00
|
|
|
var expectedCount uint64
|
2014-07-11 20:24:28 +02:00
|
|
|
doc := document.NewDocument("1")
|
2014-08-19 14:58:26 +02:00
|
|
|
doc.AddField(document.NewTextField("name", []uint64{}, []byte("test")))
|
2014-07-11 20:24:28 +02:00
|
|
|
err = idx.Update(doc)
|
|
|
|
if err != nil {
|
|
|
|
t.Errorf("Error updating index: %v", err)
|
|
|
|
}
|
2014-09-04 00:47:02 +02:00
|
|
|
expectedCount++
|
2014-07-11 20:24:28 +02:00
|
|
|
|
|
|
|
doc = document.NewDocument("2")
|
2014-08-19 14:58:26 +02:00
|
|
|
doc.AddField(document.NewTextField("name", []uint64{}, []byte("test test test")))
|
2014-09-03 19:02:10 +02:00
|
|
|
doc.AddField(document.NewTextFieldWithIndexingOptions("desc", []uint64{}, []byte("eat more rice"), document.IndexField|document.IncludeTermVectors))
|
2014-07-11 20:24:28 +02:00
|
|
|
err = idx.Update(doc)
|
|
|
|
if err != nil {
|
|
|
|
t.Errorf("Error updating index: %v", err)
|
|
|
|
}
|
2014-09-04 00:47:02 +02:00
|
|
|
expectedCount++
|
2014-07-11 20:24:28 +02:00
|
|
|
|
2014-10-31 14:40:23 +01:00
|
|
|
indexReader, err := idx.Reader()
|
|
|
|
if err != nil {
|
|
|
|
t.Error(err)
|
|
|
|
}
|
2014-09-12 23:21:35 +02:00
|
|
|
defer indexReader.Close()
|
|
|
|
|
2014-07-11 20:24:28 +02:00
|
|
|
// first get all doc ids
|
2014-09-12 23:21:35 +02:00
|
|
|
reader, err := indexReader.DocIDReader("", "")
|
2014-07-11 20:24:28 +02:00
|
|
|
if err != nil {
|
|
|
|
t.Errorf("Error accessing doc id reader: %v", err)
|
|
|
|
}
|
2014-08-15 19:12:55 +02:00
|
|
|
defer reader.Close()
|
2014-07-11 20:24:28 +02:00
|
|
|
|
|
|
|
id, err := reader.Next()
|
|
|
|
count := uint64(0)
|
|
|
|
for id != "" {
|
|
|
|
count++
|
|
|
|
id, err = reader.Next()
|
|
|
|
}
|
|
|
|
if count != expectedCount {
|
|
|
|
t.Errorf("expected %d, got %d", expectedCount, count)
|
|
|
|
}
|
2014-08-15 19:12:55 +02:00
|
|
|
|
|
|
|
// try it again, but jump to the second doc this time
|
2014-09-12 23:21:35 +02:00
|
|
|
reader, err = indexReader.DocIDReader("", "")
|
2014-08-15 19:12:55 +02:00
|
|
|
if err != nil {
|
|
|
|
t.Errorf("Error accessing doc id reader: %v", err)
|
|
|
|
}
|
|
|
|
defer reader.Close()
|
|
|
|
|
|
|
|
id, err = reader.Advance("2")
|
|
|
|
if err != nil {
|
|
|
|
t.Error(err)
|
|
|
|
}
|
|
|
|
if id != "2" {
|
|
|
|
t.Errorf("expected to find id '2', got '%s'", id)
|
|
|
|
}
|
|
|
|
|
|
|
|
id, err = reader.Advance("3")
|
|
|
|
if err != nil {
|
|
|
|
t.Error(err)
|
|
|
|
}
|
|
|
|
if id != "" {
|
|
|
|
t.Errorf("expected to find id '', got '%s'", id)
|
|
|
|
}
|
2014-07-11 20:24:28 +02:00
|
|
|
}
|