2016-10-02 16:13:14 +02:00
|
|
|
// Copyright (c) 2016 Couchbase, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
|
2016-08-20 20:03:46 +02:00
|
|
|
|
|
|
|
package smolder
|
|
|
|
|
|
|
|
import (
|
|
|
|
"sync/atomic"
|
|
|
|
|
|
|
|
"github.com/blevesearch/bleve/index"
|
|
|
|
"github.com/blevesearch/bleve/index/store"
|
|
|
|
)
|
|
|
|
|
|
|
|
type SmolderingCouchTermFieldReader struct {
|
|
|
|
count uint64
|
|
|
|
indexReader *IndexReader
|
|
|
|
iterator store.KVIterator
|
|
|
|
term []byte
|
|
|
|
tfrNext *TermFrequencyRow
|
|
|
|
field uint16
|
|
|
|
}
|
|
|
|
|
|
|
|
func newSmolderingCouchTermFieldReader(indexReader *IndexReader, term []byte, field uint16, includeFreq, includeNorm, includeTermVectors bool) (*SmolderingCouchTermFieldReader, error) {
|
|
|
|
dictionaryRow := NewDictionaryRow(term, field, 0)
|
|
|
|
val, err := indexReader.kvreader.Get(dictionaryRow.Key())
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
if val == nil {
|
|
|
|
atomic.AddUint64(&indexReader.index.stats.termSearchersStarted, uint64(1))
|
|
|
|
return &SmolderingCouchTermFieldReader{
|
|
|
|
count: 0,
|
|
|
|
term: term,
|
|
|
|
tfrNext: &TermFrequencyRow{},
|
|
|
|
field: field,
|
|
|
|
}, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
err = dictionaryRow.parseDictionaryV(val)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
2016-09-07 23:32:59 +02:00
|
|
|
tfrk := TermFrequencyRowStart(term, field, []byte{})
|
|
|
|
it := indexReader.kvreader.PrefixIterator(tfrk)
|
2016-08-20 20:03:46 +02:00
|
|
|
|
|
|
|
atomic.AddUint64(&indexReader.index.stats.termSearchersStarted, uint64(1))
|
|
|
|
return &SmolderingCouchTermFieldReader{
|
|
|
|
indexReader: indexReader,
|
|
|
|
iterator: it,
|
|
|
|
count: dictionaryRow.count,
|
|
|
|
term: term,
|
|
|
|
tfrNext: &TermFrequencyRow{},
|
|
|
|
field: field,
|
|
|
|
}, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func (r *SmolderingCouchTermFieldReader) Count() uint64 {
|
|
|
|
return r.count
|
|
|
|
}
|
|
|
|
|
|
|
|
func (r *SmolderingCouchTermFieldReader) Next(preAlloced *index.TermFieldDoc) (*index.TermFieldDoc, error) {
|
|
|
|
if r.iterator != nil {
|
|
|
|
key, val, valid := r.iterator.Current()
|
|
|
|
if valid {
|
|
|
|
tfr := r.tfrNext
|
|
|
|
err := tfr.parseKDoc(key)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
err = tfr.parseV(val)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
rv := preAlloced
|
|
|
|
if rv == nil {
|
|
|
|
rv = &index.TermFieldDoc{}
|
|
|
|
}
|
|
|
|
rv.ID = append(rv.ID, tfr.docNumber...)
|
|
|
|
rv.Freq = tfr.freq
|
|
|
|
rv.Norm = float64(tfr.norm)
|
|
|
|
if tfr.vectors != nil {
|
|
|
|
rv.Vectors = r.indexReader.index.termFieldVectorsFromTermVectors(tfr.vectors)
|
|
|
|
}
|
|
|
|
r.iterator.Next()
|
|
|
|
return rv, nil
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return nil, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func (r *SmolderingCouchTermFieldReader) Advance(docID index.IndexInternalID, preAlloced *index.TermFieldDoc) (*index.TermFieldDoc, error) {
|
|
|
|
if r.iterator != nil {
|
2016-09-07 23:32:59 +02:00
|
|
|
tfrk := TermFrequencyRowStart(r.term, r.field, docID)
|
|
|
|
r.iterator.Seek(tfrk)
|
2016-08-20 20:03:46 +02:00
|
|
|
key, val, valid := r.iterator.Current()
|
|
|
|
if valid {
|
|
|
|
tfr, err := NewTermFrequencyRowKV(key, val)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
rv := preAlloced
|
|
|
|
if rv == nil {
|
|
|
|
rv = &index.TermFieldDoc{}
|
|
|
|
}
|
|
|
|
rv.ID = append(rv.ID, tfr.docNumber...)
|
|
|
|
rv.Freq = tfr.freq
|
|
|
|
rv.Norm = float64(tfr.norm)
|
|
|
|
if tfr.vectors != nil {
|
|
|
|
rv.Vectors = r.indexReader.index.termFieldVectorsFromTermVectors(tfr.vectors)
|
|
|
|
}
|
|
|
|
r.iterator.Next()
|
|
|
|
return rv, nil
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return nil, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func (r *SmolderingCouchTermFieldReader) Close() error {
|
2016-09-30 23:08:04 +02:00
|
|
|
if r.indexReader != nil {
|
|
|
|
atomic.AddUint64(&r.indexReader.index.stats.termSearchersFinished, uint64(1))
|
|
|
|
}
|
2016-08-20 20:03:46 +02:00
|
|
|
if r.iterator != nil {
|
|
|
|
return r.iterator.Close()
|
|
|
|
}
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
type SmolderingCouchDocIDReader struct {
|
|
|
|
indexReader *IndexReader
|
|
|
|
iterator store.KVIterator
|
2016-09-02 01:13:44 +02:00
|
|
|
only map[string]struct{}
|
2016-08-20 20:03:46 +02:00
|
|
|
onlyMode bool
|
|
|
|
}
|
|
|
|
|
2016-09-09 17:04:11 +02:00
|
|
|
func newSmolderingCouchDocIDReader(indexReader *IndexReader) (*SmolderingCouchDocIDReader, error) {
|
|
|
|
|
|
|
|
startBytes := []byte{0x0}
|
|
|
|
endBytes := []byte{0xff}
|
2016-08-20 20:03:46 +02:00
|
|
|
bisrk := BackIndexRowKey(startBytes)
|
|
|
|
bierk := BackIndexRowKey(endBytes)
|
|
|
|
it := indexReader.kvreader.RangeIterator(bisrk, bierk)
|
|
|
|
|
|
|
|
return &SmolderingCouchDocIDReader{
|
|
|
|
indexReader: indexReader,
|
|
|
|
iterator: it,
|
|
|
|
}, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func newSmolderingCouchDocIDReaderOnly(indexReader *IndexReader, ids []string) (*SmolderingCouchDocIDReader, error) {
|
2016-09-02 01:13:44 +02:00
|
|
|
// put ids into map
|
|
|
|
only := make(map[string]struct{}, len(ids))
|
|
|
|
for i := range ids {
|
|
|
|
only[ids[i]] = struct{}{}
|
2016-08-20 20:03:46 +02:00
|
|
|
}
|
2016-09-02 01:13:44 +02:00
|
|
|
|
|
|
|
startBytes := []byte{0x0}
|
2016-08-20 20:03:46 +02:00
|
|
|
endBytes := []byte{0xff}
|
|
|
|
bisrk := BackIndexRowKey(startBytes)
|
|
|
|
bierk := BackIndexRowKey(endBytes)
|
|
|
|
it := indexReader.kvreader.RangeIterator(bisrk, bierk)
|
|
|
|
|
|
|
|
return &SmolderingCouchDocIDReader{
|
|
|
|
indexReader: indexReader,
|
|
|
|
iterator: it,
|
2016-09-02 01:13:44 +02:00
|
|
|
only: only,
|
2016-08-20 20:03:46 +02:00
|
|
|
onlyMode: true,
|
|
|
|
}, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func (r *SmolderingCouchDocIDReader) Next() (index.IndexInternalID, error) {
|
|
|
|
key, val, valid := r.iterator.Current()
|
|
|
|
|
|
|
|
if r.onlyMode {
|
|
|
|
var rv index.IndexInternalID
|
2016-09-02 01:13:44 +02:00
|
|
|
for valid {
|
2016-08-20 20:03:46 +02:00
|
|
|
br, err := NewBackIndexRowKV(key, val)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
2016-09-02 01:13:44 +02:00
|
|
|
|
|
|
|
// find doc id
|
2016-09-09 17:04:11 +02:00
|
|
|
for _, te := range br.termsEntries {
|
2016-09-02 01:13:44 +02:00
|
|
|
if te.GetField() == 0 {
|
2016-09-09 17:04:11 +02:00
|
|
|
for i := range te.Terms {
|
|
|
|
if _, ok := r.only[te.Terms[i]]; ok {
|
|
|
|
rv = append([]byte(nil), br.docNumber...)
|
|
|
|
r.iterator.Next()
|
|
|
|
return rv, nil
|
|
|
|
}
|
2016-09-02 01:13:44 +02:00
|
|
|
}
|
|
|
|
break
|
2016-08-20 20:03:46 +02:00
|
|
|
}
|
|
|
|
}
|
2016-09-02 01:13:44 +02:00
|
|
|
r.iterator.Next()
|
|
|
|
key, val, valid = r.iterator.Current()
|
2016-08-20 20:03:46 +02:00
|
|
|
}
|
|
|
|
} else {
|
|
|
|
if valid {
|
|
|
|
br, err := NewBackIndexRowKV(key, val)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
rv := append([]byte(nil), br.docNumber...)
|
|
|
|
r.iterator.Next()
|
|
|
|
return rv, nil
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return nil, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func (r *SmolderingCouchDocIDReader) Advance(docID index.IndexInternalID) (index.IndexInternalID, error) {
|
|
|
|
birk := BackIndexRowKey(docID)
|
|
|
|
r.iterator.Seek(birk)
|
|
|
|
key, val, valid := r.iterator.Current()
|
|
|
|
|
|
|
|
if r.onlyMode {
|
|
|
|
var rv index.IndexInternalID
|
2016-09-02 01:13:44 +02:00
|
|
|
for valid {
|
2016-08-20 20:03:46 +02:00
|
|
|
br, err := NewBackIndexRowKV(key, val)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
2016-09-02 01:13:44 +02:00
|
|
|
|
|
|
|
// find doc id
|
2016-09-09 17:04:11 +02:00
|
|
|
for _, te := range br.termsEntries {
|
2016-09-02 01:13:44 +02:00
|
|
|
if te.GetField() == 0 {
|
2016-09-09 17:04:11 +02:00
|
|
|
for i := range te.Terms {
|
|
|
|
if _, ok := r.only[te.Terms[i]]; ok {
|
|
|
|
rv = append([]byte(nil), br.docNumber...)
|
|
|
|
r.iterator.Next()
|
|
|
|
return rv, nil
|
|
|
|
}
|
2016-09-02 01:13:44 +02:00
|
|
|
}
|
|
|
|
break
|
2016-08-20 20:03:46 +02:00
|
|
|
}
|
|
|
|
}
|
2016-09-02 01:13:44 +02:00
|
|
|
r.iterator.Next()
|
|
|
|
key, val, valid = r.iterator.Current()
|
2016-08-20 20:03:46 +02:00
|
|
|
}
|
|
|
|
} else {
|
|
|
|
if valid {
|
|
|
|
br, err := NewBackIndexRowKV(key, val)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
rv := append([]byte(nil), br.docNumber...)
|
|
|
|
r.iterator.Next()
|
|
|
|
return rv, nil
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return nil, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func (r *SmolderingCouchDocIDReader) Close() error {
|
|
|
|
return r.iterator.Close()
|
|
|
|
}
|