2016-10-02 16:13:14 +02:00
|
|
|
// Copyright (c) 2016 Couchbase, Inc.
|
|
|
|
//
|
|
|
|
// Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
// you may not use this file except in compliance with the License.
|
|
|
|
// You may obtain a copy of the License at
|
|
|
|
//
|
|
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
//
|
|
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
|
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
// See the License for the specific language governing permissions and
|
|
|
|
// limitations under the License.
|
2016-08-20 20:03:46 +02:00
|
|
|
|
|
|
|
package smolder
|
|
|
|
|
|
|
|
import (
|
|
|
|
"fmt"
|
|
|
|
|
|
|
|
"github.com/blevesearch/bleve/document"
|
|
|
|
"github.com/blevesearch/bleve/index"
|
|
|
|
"github.com/blevesearch/bleve/index/store"
|
|
|
|
)
|
|
|
|
|
|
|
|
type IndexReader struct {
|
|
|
|
index *SmolderingCouch
|
|
|
|
kvreader store.KVReader
|
|
|
|
docCount uint64
|
|
|
|
}
|
|
|
|
|
|
|
|
func (i *IndexReader) TermFieldReader(term []byte, fieldName string, includeFreq, includeNorm, includeTermVectors bool) (index.TermFieldReader, error) {
|
|
|
|
fieldIndex, fieldExists := i.index.fieldCache.FieldNamed(fieldName, false)
|
|
|
|
if fieldExists {
|
|
|
|
return newSmolderingCouchTermFieldReader(i, term, uint16(fieldIndex), includeFreq, includeNorm, includeTermVectors)
|
|
|
|
}
|
|
|
|
return newSmolderingCouchTermFieldReader(i, []byte{ByteSeparator}, ^uint16(0), includeFreq, includeNorm, includeTermVectors)
|
|
|
|
}
|
|
|
|
|
|
|
|
func (i *IndexReader) FieldDict(fieldName string) (index.FieldDict, error) {
|
|
|
|
return i.FieldDictRange(fieldName, nil, nil)
|
|
|
|
}
|
|
|
|
|
|
|
|
func (i *IndexReader) FieldDictRange(fieldName string, startTerm []byte, endTerm []byte) (index.FieldDict, error) {
|
|
|
|
fieldIndex, fieldExists := i.index.fieldCache.FieldNamed(fieldName, false)
|
|
|
|
if fieldExists {
|
|
|
|
return newSmolderingCouchFieldDict(i, uint16(fieldIndex), startTerm, endTerm)
|
|
|
|
}
|
|
|
|
return newSmolderingCouchFieldDict(i, ^uint16(0), []byte{ByteSeparator}, []byte{})
|
|
|
|
}
|
|
|
|
|
|
|
|
func (i *IndexReader) FieldDictPrefix(fieldName string, termPrefix []byte) (index.FieldDict, error) {
|
|
|
|
return i.FieldDictRange(fieldName, termPrefix, termPrefix)
|
|
|
|
}
|
|
|
|
|
2016-09-09 17:04:11 +02:00
|
|
|
func (i *IndexReader) DocIDReaderAll() (index.DocIDReader, error) {
|
|
|
|
return newSmolderingCouchDocIDReader(i)
|
2016-08-20 20:03:46 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
func (i *IndexReader) DocIDReaderOnly(ids []string) (index.DocIDReader, error) {
|
|
|
|
return newSmolderingCouchDocIDReaderOnly(i, ids)
|
|
|
|
}
|
|
|
|
|
|
|
|
func (i *IndexReader) Document(id string) (doc *document.Document, err error) {
|
|
|
|
|
|
|
|
// first hit the back index to confirm doc exists
|
|
|
|
var backIndexRow *BackIndexRow
|
2016-09-13 18:40:01 +02:00
|
|
|
backIndexRow, err = i.backIndexRowForDoc(nil, id)
|
2016-08-20 20:03:46 +02:00
|
|
|
if err != nil {
|
|
|
|
return
|
|
|
|
}
|
|
|
|
if backIndexRow == nil {
|
|
|
|
return
|
|
|
|
}
|
|
|
|
doc = document.NewDocument(id)
|
|
|
|
storedRowScanPrefix := NewStoredRowDocBytes(backIndexRow.docNumber, 0, []uint64{}, 'x', nil).ScanPrefixForDoc()
|
|
|
|
it := i.kvreader.PrefixIterator(storedRowScanPrefix)
|
|
|
|
defer func() {
|
|
|
|
if cerr := it.Close(); err == nil && cerr != nil {
|
|
|
|
err = cerr
|
|
|
|
}
|
|
|
|
}()
|
|
|
|
key, val, valid := it.Current()
|
|
|
|
for valid {
|
|
|
|
safeVal := make([]byte, len(val))
|
|
|
|
copy(safeVal, val)
|
|
|
|
var row *StoredRow
|
|
|
|
row, err = NewStoredRowKV(key, safeVal)
|
|
|
|
if err != nil {
|
|
|
|
doc = nil
|
|
|
|
return
|
|
|
|
}
|
|
|
|
if row != nil {
|
|
|
|
fieldName := i.index.fieldCache.FieldIndexed(row.field)
|
|
|
|
field := decodeFieldType(row.typ, fieldName, row.arrayPositions, row.value)
|
|
|
|
if field != nil {
|
|
|
|
doc.AddField(field)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
it.Next()
|
|
|
|
key, val, valid = it.Current()
|
|
|
|
}
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
2016-09-09 20:11:28 +02:00
|
|
|
func (i *IndexReader) DocumentFieldTerms(id index.IndexInternalID, fields []string) (index.FieldTerms, error) {
|
2016-09-13 18:40:01 +02:00
|
|
|
back, err := i.backIndexRowForDoc(id, "")
|
2016-08-20 20:03:46 +02:00
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
if back == nil {
|
|
|
|
return nil, nil
|
|
|
|
}
|
|
|
|
rv := make(index.FieldTerms, len(fields))
|
|
|
|
fieldsMap := make(map[uint16]string, len(fields))
|
|
|
|
for _, f := range fields {
|
|
|
|
id, ok := i.index.fieldCache.FieldNamed(f, false)
|
|
|
|
if !ok {
|
|
|
|
return nil, fmt.Errorf("Field %s was not found in cache", f)
|
|
|
|
}
|
|
|
|
fieldsMap[id] = f
|
|
|
|
}
|
2016-09-09 17:04:11 +02:00
|
|
|
for _, entry := range back.termsEntries {
|
2016-08-20 20:03:46 +02:00
|
|
|
if field, ok := fieldsMap[uint16(*entry.Field)]; ok {
|
2016-09-09 17:04:11 +02:00
|
|
|
rv[field] = entry.Terms
|
2016-08-20 20:03:46 +02:00
|
|
|
}
|
|
|
|
}
|
|
|
|
return rv, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func (i *IndexReader) Fields() (fields []string, err error) {
|
|
|
|
fields = make([]string, 0)
|
|
|
|
it := i.kvreader.PrefixIterator([]byte{'f'})
|
|
|
|
defer func() {
|
|
|
|
if cerr := it.Close(); err == nil && cerr != nil {
|
|
|
|
err = cerr
|
|
|
|
}
|
|
|
|
}()
|
|
|
|
key, val, valid := it.Current()
|
|
|
|
for valid {
|
|
|
|
var row SmolderingCouchRow
|
|
|
|
row, err = ParseFromKeyValue(key, val)
|
|
|
|
if err != nil {
|
|
|
|
fields = nil
|
|
|
|
return
|
|
|
|
}
|
|
|
|
if row != nil {
|
|
|
|
fieldRow, ok := row.(*FieldRow)
|
|
|
|
if ok {
|
|
|
|
fields = append(fields, fieldRow.name)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
it.Next()
|
|
|
|
key, val, valid = it.Current()
|
|
|
|
}
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
|
|
|
func (i *IndexReader) GetInternal(key []byte) ([]byte, error) {
|
|
|
|
internalRow := NewInternalRow(key, nil)
|
|
|
|
return i.kvreader.Get(internalRow.Key())
|
|
|
|
}
|
|
|
|
|
2016-09-13 18:40:01 +02:00
|
|
|
func (i *IndexReader) DocCount() (uint64, error) {
|
|
|
|
return i.docCount, nil
|
2016-08-20 20:03:46 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
func (i *IndexReader) Close() error {
|
|
|
|
return i.kvreader.Close()
|
|
|
|
}
|
|
|
|
|
|
|
|
func (i *IndexReader) ExternalID(id index.IndexInternalID) (string, error) {
|
2016-09-07 23:32:59 +02:00
|
|
|
k := StoredRowDocFieldKey(id, 0)
|
|
|
|
v, err := i.kvreader.Get(k)
|
2016-08-20 20:03:46 +02:00
|
|
|
if err != nil {
|
|
|
|
return "", err
|
|
|
|
}
|
2016-09-07 23:32:59 +02:00
|
|
|
return string(v[1:]), nil
|
2016-08-20 20:03:46 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
func (i *IndexReader) InternalID(id string) (index.IndexInternalID, error) {
|
|
|
|
tfr, err := i.TermFieldReader([]byte(id), "_id", false, false, false)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
if tfr.Count() < 1 {
|
|
|
|
return nil, nil
|
|
|
|
}
|
2016-09-09 21:56:29 +02:00
|
|
|
pre := index.TermFieldDoc{}
|
|
|
|
tfd, err := tfr.Next(&pre)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
2016-08-20 20:03:46 +02:00
|
|
|
return tfd.ID, nil
|
|
|
|
}
|
|
|
|
|
2016-09-13 18:40:01 +02:00
|
|
|
func (i *IndexReader) backIndexRowForDoc(docID index.IndexInternalID, externalDocID string) (*BackIndexRow, error) {
|
|
|
|
|
|
|
|
var err error
|
|
|
|
// first look up the docID if it isn't known
|
|
|
|
if docID == nil {
|
|
|
|
// first get the internal identifier
|
|
|
|
docID, err = i.InternalID(externalDocID)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if len(docID) < 1 {
|
|
|
|
return nil, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
// use a temporary row structure to build key
|
|
|
|
tempRow := &BackIndexRow{
|
|
|
|
docNumber: docID,
|
|
|
|
}
|
|
|
|
|
|
|
|
keyBuf := GetRowBuffer()
|
|
|
|
if tempRow.KeySize() > len(keyBuf) {
|
|
|
|
keyBuf = make([]byte, 2*tempRow.KeySize())
|
|
|
|
}
|
|
|
|
defer PutRowBuffer(keyBuf)
|
|
|
|
keySize, err := tempRow.KeyTo(keyBuf)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
value, err := i.kvreader.Get(keyBuf[:keySize])
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
if value == nil {
|
|
|
|
return nil, nil
|
|
|
|
}
|
|
|
|
backIndexRow, err := NewBackIndexRowKV(keyBuf[:keySize], value)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
return backIndexRow, nil
|
|
|
|
}
|
|
|
|
|
2016-08-20 20:03:46 +02:00
|
|
|
func incrementBytes(in []byte) []byte {
|
|
|
|
rv := make([]byte, len(in))
|
|
|
|
copy(rv, in)
|
|
|
|
for i := len(rv) - 1; i >= 0; i-- {
|
|
|
|
rv[i] = rv[i] + 1
|
|
|
|
if rv[i] != 0 {
|
|
|
|
// didn't overflow, so stop
|
|
|
|
break
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return rv
|
|
|
|
}
|