3247 lines
73 KiB
Go
3247 lines
73 KiB
Go
// Copyright (c) 2014 Couchbase, Inc.
|
|
//
|
|
// Licensed under the Apache License, Version 2.0 (the "License");
|
|
// you may not use this file except in compliance with the License.
|
|
// You may obtain a copy of the License at
|
|
//
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
//
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
// See the License for the specific language governing permissions and
|
|
// limitations under the License.
|
|
|
|
package bleve
|
|
|
|
import (
|
|
"context"
|
|
"encoding/json"
|
|
"fmt"
|
|
"io"
|
|
"log"
|
|
"math"
|
|
"os"
|
|
"path/filepath"
|
|
"reflect"
|
|
"sort"
|
|
"strconv"
|
|
"strings"
|
|
"sync"
|
|
"testing"
|
|
"time"
|
|
|
|
"github.com/blevesearch/bleve/v2/analysis/analyzer/keyword"
|
|
"github.com/blevesearch/bleve/v2/document"
|
|
"github.com/blevesearch/bleve/v2/index/upsidedown/store/boltdb"
|
|
"github.com/blevesearch/bleve/v2/index/upsidedown/store/null"
|
|
"github.com/blevesearch/bleve/v2/mapping"
|
|
"github.com/blevesearch/bleve/v2/search"
|
|
"github.com/blevesearch/bleve/v2/search/query"
|
|
index "github.com/blevesearch/bleve_index_api"
|
|
|
|
"github.com/blevesearch/bleve/v2/index/scorch"
|
|
"github.com/blevesearch/bleve/v2/index/upsidedown"
|
|
)
|
|
|
|
type Fatalfable interface {
|
|
Fatalf(format string, args ...interface{})
|
|
}
|
|
|
|
func createTmpIndexPath(f Fatalfable) string {
|
|
tmpIndexPath, err := os.MkdirTemp("", "bleve-testidx")
|
|
if err != nil {
|
|
f.Fatalf("error creating temp dir: %v", err)
|
|
}
|
|
return tmpIndexPath
|
|
}
|
|
|
|
func cleanupTmpIndexPath(f Fatalfable, path string) {
|
|
err := os.RemoveAll(path)
|
|
if err != nil {
|
|
f.Fatalf("error removing temp dir: %v", err)
|
|
}
|
|
}
|
|
|
|
func TestCrud(t *testing.T) {
|
|
tmpIndexPath := createTmpIndexPath(t)
|
|
defer cleanupTmpIndexPath(t, tmpIndexPath)
|
|
|
|
idx, err := New(tmpIndexPath, NewIndexMapping())
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
doca := map[string]interface{}{
|
|
"name": "marty",
|
|
"desc": "gophercon india",
|
|
}
|
|
err = idx.Index("a", doca)
|
|
if err != nil {
|
|
t.Error(err)
|
|
}
|
|
|
|
docy := map[string]interface{}{
|
|
"name": "jasper",
|
|
"desc": "clojure",
|
|
}
|
|
err = idx.Index("y", docy)
|
|
if err != nil {
|
|
t.Error(err)
|
|
}
|
|
|
|
err = idx.Delete("y")
|
|
if err != nil {
|
|
t.Error(err)
|
|
}
|
|
|
|
docx := map[string]interface{}{
|
|
"name": "rose",
|
|
"desc": "googler",
|
|
}
|
|
err = idx.Index("x", docx)
|
|
if err != nil {
|
|
t.Error(err)
|
|
}
|
|
|
|
err = idx.SetInternal([]byte("status"), []byte("pending"))
|
|
if err != nil {
|
|
t.Error(err)
|
|
}
|
|
|
|
docb := map[string]interface{}{
|
|
"name": "steve",
|
|
"desc": "cbft master",
|
|
}
|
|
batch := idx.NewBatch()
|
|
err = batch.Index("b", docb)
|
|
if err != nil {
|
|
t.Error(err)
|
|
}
|
|
batch.Delete("x")
|
|
batch.SetInternal([]byte("batchi"), []byte("batchv"))
|
|
batch.DeleteInternal([]byte("status"))
|
|
err = idx.Batch(batch)
|
|
if err != nil {
|
|
t.Error(err)
|
|
}
|
|
val, err := idx.GetInternal([]byte("batchi"))
|
|
if err != nil {
|
|
t.Error(err)
|
|
}
|
|
if string(val) != "batchv" {
|
|
t.Errorf("expected 'batchv', got '%s'", val)
|
|
}
|
|
val, err = idx.GetInternal([]byte("status"))
|
|
if err != nil {
|
|
t.Error(err)
|
|
}
|
|
if val != nil {
|
|
t.Errorf("expected nil, got '%s'", val)
|
|
}
|
|
|
|
err = idx.SetInternal([]byte("seqno"), []byte("7"))
|
|
if err != nil {
|
|
t.Error(err)
|
|
}
|
|
err = idx.SetInternal([]byte("status"), []byte("ready"))
|
|
if err != nil {
|
|
t.Error(err)
|
|
}
|
|
err = idx.DeleteInternal([]byte("status"))
|
|
if err != nil {
|
|
t.Error(err)
|
|
}
|
|
val, err = idx.GetInternal([]byte("status"))
|
|
if err != nil {
|
|
t.Error(err)
|
|
}
|
|
if val != nil {
|
|
t.Errorf("expected nil, got '%s'", val)
|
|
}
|
|
|
|
val, err = idx.GetInternal([]byte("seqno"))
|
|
if err != nil {
|
|
t.Error(err)
|
|
}
|
|
if string(val) != "7" {
|
|
t.Errorf("expected '7', got '%s'", val)
|
|
}
|
|
|
|
// close the index, open it again, and try some more things
|
|
err = idx.Close()
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
idx, err = Open(tmpIndexPath)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
defer func() {
|
|
err := idx.Close()
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
}()
|
|
|
|
count, err := idx.DocCount()
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
if count != 2 {
|
|
t.Errorf("expected doc count 2, got %d", count)
|
|
}
|
|
|
|
doc, err := idx.Document("a")
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
foundNameField := false
|
|
doc.VisitFields(func(field index.Field) {
|
|
if field.Name() == "name" && string(field.Value()) == "marty" {
|
|
foundNameField = true
|
|
}
|
|
})
|
|
if !foundNameField {
|
|
t.Errorf("expected to find field named 'name' with value 'marty'")
|
|
}
|
|
|
|
fields, err := idx.Fields()
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
expectedFields := map[string]bool{
|
|
"_all": false,
|
|
"name": false,
|
|
"desc": false,
|
|
}
|
|
if len(fields) < len(expectedFields) {
|
|
t.Fatalf("expected %d fields got %d", len(expectedFields), len(fields))
|
|
}
|
|
for _, f := range fields {
|
|
expectedFields[f] = true
|
|
}
|
|
for ef, efp := range expectedFields {
|
|
if !efp {
|
|
t.Errorf("field %s is missing", ef)
|
|
}
|
|
}
|
|
}
|
|
|
|
func approxSame(actual, expected uint64) bool {
|
|
modulus := func(a, b uint64) uint64 {
|
|
if a > b {
|
|
return a - b
|
|
}
|
|
return b - a
|
|
}
|
|
|
|
return float64(modulus(actual, expected))/float64(expected) < float64(0.30)
|
|
}
|
|
|
|
func checkStatsOnIndexedBatch(indexPath string, indexMapping mapping.IndexMapping,
|
|
expectedVal uint64,
|
|
) error {
|
|
var wg sync.WaitGroup
|
|
var statValError error
|
|
|
|
idx, err := NewUsing(indexPath, indexMapping, Config.DefaultIndexType, Config.DefaultMemKVStore, nil)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
|
|
batch, err := getBatchFromData(idx, "sample-data.json")
|
|
if err != nil {
|
|
return fmt.Errorf("failed to form a batch %v\n", err)
|
|
}
|
|
wg.Add(1)
|
|
batch.SetPersistedCallback(func(e error) {
|
|
defer wg.Done()
|
|
stats, _ := idx.StatsMap()["index"].(map[string]interface{})
|
|
bytesWritten, _ := stats["num_bytes_written_at_index_time"].(uint64)
|
|
if !approxSame(bytesWritten, expectedVal) {
|
|
statValError = fmt.Errorf("expected bytes written is %d, got %v", expectedVal,
|
|
bytesWritten)
|
|
}
|
|
})
|
|
err = idx.Batch(batch)
|
|
if err != nil {
|
|
return fmt.Errorf("failed to index batch %v\n", err)
|
|
}
|
|
wg.Wait()
|
|
idx.Close()
|
|
|
|
return statValError
|
|
}
|
|
|
|
func TestBytesWritten(t *testing.T) {
|
|
tmpIndexPath := createTmpIndexPath(t)
|
|
|
|
indexMapping := NewIndexMapping()
|
|
indexMapping.TypeField = "type"
|
|
indexMapping.DefaultAnalyzer = "en"
|
|
documentMapping := NewDocumentMapping()
|
|
indexMapping.AddDocumentMapping("hotel", documentMapping)
|
|
|
|
indexMapping.DocValuesDynamic = false
|
|
indexMapping.StoreDynamic = false
|
|
|
|
contentFieldMapping := NewTextFieldMapping()
|
|
contentFieldMapping.Index = true
|
|
contentFieldMapping.Store = false
|
|
contentFieldMapping.IncludeInAll = false
|
|
contentFieldMapping.IncludeTermVectors = false
|
|
contentFieldMapping.DocValues = false
|
|
|
|
reviewsMapping := NewDocumentMapping()
|
|
reviewsMapping.AddFieldMappingsAt("content", contentFieldMapping)
|
|
documentMapping.AddSubDocumentMapping("reviews", reviewsMapping)
|
|
|
|
typeFieldMapping := NewTextFieldMapping()
|
|
typeFieldMapping.Store = false
|
|
typeFieldMapping.IncludeInAll = false
|
|
typeFieldMapping.IncludeTermVectors = false
|
|
typeFieldMapping.DocValues = false
|
|
documentMapping.AddFieldMappingsAt("type", typeFieldMapping)
|
|
|
|
err = checkStatsOnIndexedBatch(tmpIndexPath, indexMapping, 57273)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
cleanupTmpIndexPath(t, tmpIndexPath)
|
|
|
|
contentFieldMapping.Store = true
|
|
tmpIndexPath1 := createTmpIndexPath(t)
|
|
|
|
err := checkStatsOnIndexedBatch(tmpIndexPath1, indexMapping, 76069)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
cleanupTmpIndexPath(t, tmpIndexPath1)
|
|
|
|
contentFieldMapping.Store = false
|
|
contentFieldMapping.IncludeInAll = true
|
|
tmpIndexPath2 := createTmpIndexPath(t)
|
|
|
|
err = checkStatsOnIndexedBatch(tmpIndexPath2, indexMapping, 68875)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
cleanupTmpIndexPath(t, tmpIndexPath2)
|
|
|
|
contentFieldMapping.IncludeInAll = false
|
|
contentFieldMapping.IncludeTermVectors = true
|
|
tmpIndexPath3 := createTmpIndexPath(t)
|
|
|
|
err = checkStatsOnIndexedBatch(tmpIndexPath3, indexMapping, 78985)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
cleanupTmpIndexPath(t, tmpIndexPath3)
|
|
|
|
contentFieldMapping.IncludeTermVectors = false
|
|
contentFieldMapping.DocValues = true
|
|
tmpIndexPath4 := createTmpIndexPath(t)
|
|
|
|
err = checkStatsOnIndexedBatch(tmpIndexPath4, indexMapping, 64228)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
cleanupTmpIndexPath(t, tmpIndexPath4)
|
|
}
|
|
|
|
func createIndexMappingOnSampleData() *mapping.IndexMappingImpl {
|
|
indexMapping := NewIndexMapping()
|
|
indexMapping.TypeField = "type"
|
|
indexMapping.DefaultAnalyzer = "en"
|
|
indexMapping.ScoringModel = index.DefaultScoringModel
|
|
documentMapping := NewDocumentMapping()
|
|
indexMapping.AddDocumentMapping("hotel", documentMapping)
|
|
indexMapping.StoreDynamic = false
|
|
indexMapping.DocValuesDynamic = false
|
|
contentFieldMapping := NewTextFieldMapping()
|
|
contentFieldMapping.Store = false
|
|
|
|
reviewsMapping := NewDocumentMapping()
|
|
reviewsMapping.AddFieldMappingsAt("content", contentFieldMapping)
|
|
documentMapping.AddSubDocumentMapping("reviews", reviewsMapping)
|
|
|
|
typeFieldMapping := NewTextFieldMapping()
|
|
typeFieldMapping.Store = false
|
|
documentMapping.AddFieldMappingsAt("type", typeFieldMapping)
|
|
|
|
return indexMapping
|
|
}
|
|
|
|
func TestBM25TFIDFScoring(t *testing.T) {
|
|
tmpIndexPath1 := createTmpIndexPath(t)
|
|
defer cleanupTmpIndexPath(t, tmpIndexPath1)
|
|
tmpIndexPath2 := createTmpIndexPath(t)
|
|
defer cleanupTmpIndexPath(t, tmpIndexPath2)
|
|
|
|
indexMapping := createIndexMappingOnSampleData()
|
|
indexMapping.ScoringModel = index.BM25Scoring
|
|
indexBM25, err := NewUsing(tmpIndexPath1, indexMapping, Config.DefaultIndexType, Config.DefaultMemKVStore, nil)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
indexMapping1 := createIndexMappingOnSampleData()
|
|
indexTFIDF, err := NewUsing(tmpIndexPath2, indexMapping1, Config.DefaultIndexType, Config.DefaultMemKVStore, nil)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
defer func() {
|
|
err := indexBM25.Close()
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
err = indexTFIDF.Close()
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
}()
|
|
|
|
batch, err := getBatchFromData(indexBM25, "sample-data.json")
|
|
if err != nil {
|
|
t.Fatalf("failed to form a batch")
|
|
}
|
|
err = indexBM25.Batch(batch)
|
|
if err != nil {
|
|
t.Fatalf("failed to index batch %v\n", err)
|
|
}
|
|
query := NewMatchQuery("Hotel")
|
|
query.FieldVal = "name"
|
|
searchRequest := NewSearchRequestOptions(query, int(10), 0, true)
|
|
|
|
resBM25, err := indexBM25.Search(searchRequest)
|
|
if err != nil {
|
|
t.Error(err)
|
|
}
|
|
|
|
batch, err = getBatchFromData(indexTFIDF, "sample-data.json")
|
|
if err != nil {
|
|
t.Fatalf("failed to form a batch")
|
|
}
|
|
err = indexTFIDF.Batch(batch)
|
|
if err != nil {
|
|
t.Fatalf("failed to index batch %v\n", err)
|
|
}
|
|
|
|
resTFIDF, err := indexTFIDF.Search(searchRequest)
|
|
if err != nil {
|
|
t.Error(err)
|
|
}
|
|
|
|
for i, hit := range resTFIDF.Hits {
|
|
if hit.Score < resBM25.Hits[i].Score {
|
|
t.Fatalf("expected the score to be higher for BM25, got %v and %v",
|
|
resBM25.Hits[i].Score, hit.Score)
|
|
}
|
|
}
|
|
}
|
|
|
|
func TestBM25GlobalScoring(t *testing.T) {
|
|
tmpIndexPath := createTmpIndexPath(t)
|
|
defer cleanupTmpIndexPath(t, tmpIndexPath)
|
|
|
|
indexMapping := createIndexMappingOnSampleData()
|
|
indexMapping.ScoringModel = index.BM25Scoring
|
|
idxSinglePartition, err := NewUsing(tmpIndexPath, indexMapping, Config.DefaultIndexType, Config.DefaultMemKVStore, nil)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
defer func() {
|
|
err := idxSinglePartition.Close()
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
}()
|
|
|
|
batch, err := getBatchFromData(idxSinglePartition, "sample-data.json")
|
|
if err != nil {
|
|
t.Fatalf("failed to form a batch")
|
|
}
|
|
err = idxSinglePartition.Batch(batch)
|
|
if err != nil {
|
|
t.Fatalf("failed to index batch %v\n", err)
|
|
}
|
|
query := NewMatchQuery("Hotel")
|
|
query.FieldVal = "name"
|
|
searchRequest := NewSearchRequestOptions(query, int(10), 0, true)
|
|
|
|
res, err := idxSinglePartition.Search(searchRequest)
|
|
if err != nil {
|
|
t.Error(err)
|
|
}
|
|
|
|
singlePartHits := res.Hits
|
|
|
|
dataset, _ := readDataFromFile("sample-data.json")
|
|
tmpIndexPath1 := createTmpIndexPath(t)
|
|
defer cleanupTmpIndexPath(t, tmpIndexPath1)
|
|
|
|
idxPart1, err := NewUsing(tmpIndexPath1, indexMapping, Config.DefaultIndexType, Config.DefaultMemKVStore, nil)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
defer func() {
|
|
err := idxPart1.Close()
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
}()
|
|
|
|
batch1 := idxPart1.NewBatch()
|
|
for _, doc := range dataset[:len(dataset)/2] {
|
|
err = batch1.Index(fmt.Sprintf("%d", doc["id"]), doc)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
}
|
|
err = idxPart1.Batch(batch1)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
tmpIndexPath2 := createTmpIndexPath(t)
|
|
defer cleanupTmpIndexPath(t, tmpIndexPath2)
|
|
|
|
idxPart2, err := NewUsing(tmpIndexPath2, indexMapping, Config.DefaultIndexType, Config.DefaultMemKVStore, nil)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
defer func() {
|
|
err := idxPart2.Close()
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
}()
|
|
|
|
batch2 := idxPart2.NewBatch()
|
|
for _, doc := range dataset[len(dataset)/2:] {
|
|
err = batch2.Index(fmt.Sprintf("%d", doc["id"]), doc)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
}
|
|
err = idxPart2.Batch(batch2)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
multiPartIndex := NewIndexAlias(idxPart1, idxPart2)
|
|
err = multiPartIndex.SetIndexMapping(indexMapping)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
ctx := context.Background()
|
|
// this key is set to ensure that we have a consistent scoring at the index alias
|
|
// level (it forces a pre search phase which can have a small overhead)
|
|
ctx = context.WithValue(ctx, search.SearchTypeKey, search.GlobalScoring)
|
|
|
|
res, err = multiPartIndex.SearchInContext(ctx, searchRequest)
|
|
if err != nil {
|
|
t.Error(err)
|
|
}
|
|
|
|
for i, hit := range res.Hits {
|
|
if hit.Score != singlePartHits[i].Score {
|
|
t.Fatalf("expected the scores to be the same, got %v and %v",
|
|
hit.Score, singlePartHits[i].Score)
|
|
}
|
|
}
|
|
}
|
|
|
|
func TestBytesRead(t *testing.T) {
|
|
tmpIndexPath := createTmpIndexPath(t)
|
|
defer cleanupTmpIndexPath(t, tmpIndexPath)
|
|
|
|
indexMapping := NewIndexMapping()
|
|
indexMapping.TypeField = "type"
|
|
indexMapping.DefaultAnalyzer = "en"
|
|
documentMapping := NewDocumentMapping()
|
|
indexMapping.AddDocumentMapping("hotel", documentMapping)
|
|
indexMapping.StoreDynamic = false
|
|
indexMapping.DocValuesDynamic = false
|
|
contentFieldMapping := NewTextFieldMapping()
|
|
contentFieldMapping.Store = false
|
|
|
|
reviewsMapping := NewDocumentMapping()
|
|
reviewsMapping.AddFieldMappingsAt("content", contentFieldMapping)
|
|
documentMapping.AddSubDocumentMapping("reviews", reviewsMapping)
|
|
|
|
typeFieldMapping := NewTextFieldMapping()
|
|
typeFieldMapping.Store = false
|
|
documentMapping.AddFieldMappingsAt("type", typeFieldMapping)
|
|
|
|
idx, err := NewUsing(tmpIndexPath, indexMapping, Config.DefaultIndexType, Config.DefaultMemKVStore, nil)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
defer func() {
|
|
err := idx.Close()
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
}()
|
|
|
|
batch, err := getBatchFromData(idx, "sample-data.json")
|
|
if err != nil {
|
|
t.Fatalf("failed to form a batch")
|
|
}
|
|
err = idx.Batch(batch)
|
|
if err != nil {
|
|
t.Fatalf("failed to index batch %v\n", err)
|
|
}
|
|
query := NewQueryStringQuery("united")
|
|
searchRequest := NewSearchRequestOptions(query, int(10), 0, true)
|
|
|
|
res, err := idx.Search(searchRequest)
|
|
if err != nil {
|
|
t.Error(err)
|
|
}
|
|
stats, _ := idx.StatsMap()["index"].(map[string]interface{})
|
|
prevBytesRead, _ := stats["num_bytes_read_at_query_time"].(uint64)
|
|
|
|
expectedBytesRead := uint64(22049)
|
|
if supportForVectorSearch {
|
|
expectedBytesRead = 22459
|
|
}
|
|
|
|
if prevBytesRead != expectedBytesRead && res.Cost == prevBytesRead {
|
|
t.Fatalf("expected bytes read for query string %v, got %v",
|
|
expectedBytesRead, prevBytesRead)
|
|
}
|
|
|
|
// subsequent queries on the same field results in lesser amount
|
|
// of bytes read because the segment static and dictionary is reused and not
|
|
// loaded from mmap'd filed
|
|
res, err = idx.Search(searchRequest)
|
|
if err != nil {
|
|
t.Error(err)
|
|
}
|
|
stats, _ = idx.StatsMap()["index"].(map[string]interface{})
|
|
bytesRead, _ := stats["num_bytes_read_at_query_time"].(uint64)
|
|
if bytesRead-prevBytesRead != 66 && res.Cost == bytesRead-prevBytesRead {
|
|
t.Fatalf("expected bytes read for query string 66, got %v",
|
|
bytesRead-prevBytesRead)
|
|
}
|
|
prevBytesRead = bytesRead
|
|
|
|
fuzz := NewFuzzyQuery("hotel")
|
|
fuzz.FieldVal = "reviews.content"
|
|
fuzz.Fuzziness = 2
|
|
searchRequest = NewSearchRequest(fuzz)
|
|
res, err = idx.Search(searchRequest)
|
|
if err != nil {
|
|
t.Error(err)
|
|
}
|
|
stats, _ = idx.StatsMap()["index"].(map[string]interface{})
|
|
bytesRead, _ = stats["num_bytes_read_at_query_time"].(uint64)
|
|
if bytesRead-prevBytesRead != 8468 && res.Cost == bytesRead-prevBytesRead {
|
|
t.Fatalf("expected bytes read for fuzzy query is 8468, got %v",
|
|
bytesRead-prevBytesRead)
|
|
}
|
|
prevBytesRead = bytesRead
|
|
|
|
typeFacet := NewFacetRequest("type", 2)
|
|
query = NewQueryStringQuery("united")
|
|
searchRequest = NewSearchRequestOptions(query, int(0), 0, true)
|
|
searchRequest.AddFacet("types", typeFacet)
|
|
res, err = idx.Search(searchRequest)
|
|
if err != nil {
|
|
t.Error(err)
|
|
}
|
|
|
|
stats, _ = idx.StatsMap()["index"].(map[string]interface{})
|
|
bytesRead, _ = stats["num_bytes_read_at_query_time"].(uint64)
|
|
if !approxSame(bytesRead-prevBytesRead, 196) && res.Cost == bytesRead-prevBytesRead {
|
|
t.Fatalf("expected bytes read for faceted query is around 196, got %v",
|
|
bytesRead-prevBytesRead)
|
|
}
|
|
prevBytesRead = bytesRead
|
|
|
|
min := float64(8660)
|
|
max := float64(8665)
|
|
numRangeQuery := NewNumericRangeQuery(&min, &max)
|
|
numRangeQuery.FieldVal = "id"
|
|
searchRequest = NewSearchRequestOptions(numRangeQuery, int(10), 0, true)
|
|
res, err = idx.Search(searchRequest)
|
|
if err != nil {
|
|
t.Error(err)
|
|
}
|
|
|
|
stats, _ = idx.StatsMap()["index"].(map[string]interface{})
|
|
bytesRead, _ = stats["num_bytes_read_at_query_time"].(uint64)
|
|
if bytesRead-prevBytesRead != 924 && res.Cost == bytesRead-prevBytesRead {
|
|
t.Fatalf("expected bytes read for numeric range query is 924, got %v",
|
|
bytesRead-prevBytesRead)
|
|
}
|
|
prevBytesRead = bytesRead
|
|
|
|
searchRequest = NewSearchRequestOptions(query, int(10), 0, true)
|
|
searchRequest.Highlight = &HighlightRequest{}
|
|
res, err = idx.Search(searchRequest)
|
|
if err != nil {
|
|
t.Error(err)
|
|
}
|
|
|
|
stats, _ = idx.StatsMap()["index"].(map[string]interface{})
|
|
bytesRead, _ = stats["num_bytes_read_at_query_time"].(uint64)
|
|
if bytesRead-prevBytesRead != 105 && res.Cost == bytesRead-prevBytesRead {
|
|
t.Fatalf("expected bytes read for query with highlighter is 105, got %v",
|
|
bytesRead-prevBytesRead)
|
|
}
|
|
prevBytesRead = bytesRead
|
|
|
|
disQuery := NewDisjunctionQuery(NewMatchQuery("hotel"), NewMatchQuery("united"))
|
|
searchRequest = NewSearchRequestOptions(disQuery, int(10), 0, true)
|
|
res, err = idx.Search(searchRequest)
|
|
if err != nil {
|
|
t.Error(err)
|
|
}
|
|
// expectation is that the bytes read is roughly equal to sum of sub queries in
|
|
// the disjunction query plus the segment loading portion for the second subquery
|
|
// since it's created afresh and not reused
|
|
stats, _ = idx.StatsMap()["index"].(map[string]interface{})
|
|
bytesRead, _ = stats["num_bytes_read_at_query_time"].(uint64)
|
|
if bytesRead-prevBytesRead != 120 && res.Cost == bytesRead-prevBytesRead {
|
|
t.Fatalf("expected bytes read for disjunction query is 120, got %v",
|
|
bytesRead-prevBytesRead)
|
|
}
|
|
}
|
|
|
|
func TestBytesReadStored(t *testing.T) {
|
|
tmpIndexPath := createTmpIndexPath(t)
|
|
defer cleanupTmpIndexPath(t, tmpIndexPath)
|
|
|
|
indexMapping := NewIndexMapping()
|
|
indexMapping.TypeField = "type"
|
|
indexMapping.DefaultAnalyzer = "en"
|
|
documentMapping := NewDocumentMapping()
|
|
indexMapping.AddDocumentMapping("hotel", documentMapping)
|
|
|
|
indexMapping.DocValuesDynamic = false
|
|
indexMapping.StoreDynamic = false
|
|
|
|
contentFieldMapping := NewTextFieldMapping()
|
|
contentFieldMapping.Store = true
|
|
contentFieldMapping.IncludeInAll = false
|
|
contentFieldMapping.IncludeTermVectors = false
|
|
|
|
reviewsMapping := NewDocumentMapping()
|
|
reviewsMapping.AddFieldMappingsAt("content", contentFieldMapping)
|
|
documentMapping.AddSubDocumentMapping("reviews", reviewsMapping)
|
|
|
|
typeFieldMapping := NewTextFieldMapping()
|
|
typeFieldMapping.Store = false
|
|
typeFieldMapping.IncludeInAll = false
|
|
typeFieldMapping.IncludeTermVectors = false
|
|
documentMapping.AddFieldMappingsAt("type", typeFieldMapping)
|
|
idx, err := NewUsing(tmpIndexPath, indexMapping, Config.DefaultIndexType, Config.DefaultMemKVStore, nil)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
batch, err := getBatchFromData(idx, "sample-data.json")
|
|
if err != nil {
|
|
t.Fatalf("failed to form a batch %v\n", err)
|
|
}
|
|
err = idx.Batch(batch)
|
|
if err != nil {
|
|
t.Fatalf("failed to index batch %v\n", err)
|
|
}
|
|
query := NewTermQuery("hotel")
|
|
query.FieldVal = "reviews.content"
|
|
searchRequest := NewSearchRequestOptions(query, int(10), 0, true)
|
|
res, err := idx.Search(searchRequest)
|
|
if err != nil {
|
|
t.Error(err)
|
|
}
|
|
|
|
stats, _ := idx.StatsMap()["index"].(map[string]interface{})
|
|
bytesRead, _ := stats["num_bytes_read_at_query_time"].(uint64)
|
|
|
|
expectedBytesRead := uint64(11911)
|
|
if supportForVectorSearch {
|
|
expectedBytesRead = 12321
|
|
}
|
|
|
|
if bytesRead != expectedBytesRead && bytesRead == res.Cost {
|
|
t.Fatalf("expected the bytes read stat to be around %v, got %v", expectedBytesRead, bytesRead)
|
|
}
|
|
prevBytesRead := bytesRead
|
|
|
|
searchRequest = NewSearchRequestOptions(query, int(10), 0, true)
|
|
res, err = idx.Search(searchRequest)
|
|
if err != nil {
|
|
t.Error(err)
|
|
}
|
|
stats, _ = idx.StatsMap()["index"].(map[string]interface{})
|
|
bytesRead, _ = stats["num_bytes_read_at_query_time"].(uint64)
|
|
if bytesRead-prevBytesRead != 48 && bytesRead-prevBytesRead == res.Cost {
|
|
t.Fatalf("expected the bytes read stat to be around 48, got %v", bytesRead-prevBytesRead)
|
|
}
|
|
prevBytesRead = bytesRead
|
|
|
|
searchRequest = NewSearchRequestOptions(query, int(10), 0, true)
|
|
searchRequest.Fields = []string{"*"}
|
|
res, err = idx.Search(searchRequest)
|
|
if err != nil {
|
|
t.Error(err)
|
|
}
|
|
|
|
stats, _ = idx.StatsMap()["index"].(map[string]interface{})
|
|
bytesRead, _ = stats["num_bytes_read_at_query_time"].(uint64)
|
|
|
|
if bytesRead-prevBytesRead != 26511 && bytesRead-prevBytesRead == res.Cost {
|
|
t.Fatalf("expected the bytes read stat to be around 26511, got %v",
|
|
bytesRead-prevBytesRead)
|
|
}
|
|
idx.Close()
|
|
cleanupTmpIndexPath(t, tmpIndexPath)
|
|
|
|
// same type of querying but on field "type"
|
|
contentFieldMapping.Store = false
|
|
typeFieldMapping.Store = true
|
|
|
|
tmpIndexPath1 := createTmpIndexPath(t)
|
|
defer cleanupTmpIndexPath(t, tmpIndexPath1)
|
|
|
|
idx1, err := NewUsing(tmpIndexPath1, indexMapping, Config.DefaultIndexType, Config.DefaultMemKVStore, nil)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
defer func() {
|
|
err := idx1.Close()
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
}()
|
|
|
|
batch, err = getBatchFromData(idx1, "sample-data.json")
|
|
if err != nil {
|
|
t.Fatalf("failed to form a batch %v\n", err)
|
|
}
|
|
err = idx1.Batch(batch)
|
|
if err != nil {
|
|
t.Fatalf("failed to index batch %v\n", err)
|
|
}
|
|
|
|
query = NewTermQuery("hotel")
|
|
query.FieldVal = "type"
|
|
searchRequest = NewSearchRequestOptions(query, int(10), 0, true)
|
|
res, err = idx1.Search(searchRequest)
|
|
if err != nil {
|
|
t.Error(err)
|
|
}
|
|
|
|
stats, _ = idx1.StatsMap()["index"].(map[string]interface{})
|
|
bytesRead, _ = stats["num_bytes_read_at_query_time"].(uint64)
|
|
|
|
expectedBytesRead = uint64(4097)
|
|
if supportForVectorSearch {
|
|
expectedBytesRead = 4507
|
|
}
|
|
|
|
if bytesRead != expectedBytesRead && bytesRead == res.Cost {
|
|
t.Fatalf("expected the bytes read stat to be around %v, got %v", expectedBytesRead, bytesRead)
|
|
}
|
|
prevBytesRead = bytesRead
|
|
|
|
res, err = idx1.Search(searchRequest)
|
|
if err != nil {
|
|
t.Error(err)
|
|
}
|
|
stats, _ = idx1.StatsMap()["index"].(map[string]interface{})
|
|
bytesRead, _ = stats["num_bytes_read_at_query_time"].(uint64)
|
|
if bytesRead-prevBytesRead != 47 && bytesRead-prevBytesRead == res.Cost {
|
|
t.Fatalf("expected the bytes read stat to be around 47, got %v", bytesRead-prevBytesRead)
|
|
}
|
|
prevBytesRead = bytesRead
|
|
|
|
searchRequest.Fields = []string{"*"}
|
|
res, err = idx1.Search(searchRequest)
|
|
if err != nil {
|
|
t.Error(err)
|
|
}
|
|
|
|
stats, _ = idx1.StatsMap()["index"].(map[string]interface{})
|
|
bytesRead, _ = stats["num_bytes_read_at_query_time"].(uint64)
|
|
if bytesRead-prevBytesRead != 77 && bytesRead-prevBytesRead == res.Cost {
|
|
t.Fatalf("expected the bytes read stat to be around 77, got %v", bytesRead-prevBytesRead)
|
|
}
|
|
}
|
|
|
|
func readDataFromFile(fileName string) ([]map[string]interface{}, error) {
|
|
pwd, err := os.Getwd()
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
path := filepath.Join(pwd, "data", "test", fileName)
|
|
|
|
var dataset []map[string]interface{}
|
|
fileContent, err := os.ReadFile(path)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
err = json.Unmarshal(fileContent, &dataset)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
return dataset, nil
|
|
}
|
|
|
|
func getBatchFromData(idx Index, fileName string) (*Batch, error) {
|
|
dataset, err := readDataFromFile(fileName)
|
|
batch := idx.NewBatch()
|
|
for _, doc := range dataset {
|
|
err = batch.Index(fmt.Sprintf("%d", doc["id"]), doc)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
}
|
|
|
|
return batch, err
|
|
}
|
|
|
|
func TestIndexCreateNewOverExisting(t *testing.T) {
|
|
tmpIndexPath := createTmpIndexPath(t)
|
|
|
|
index, err := New(tmpIndexPath, NewIndexMapping())
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
err = index.Close()
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
_, err = New(tmpIndexPath, NewIndexMapping())
|
|
if err != ErrorIndexPathExists {
|
|
t.Fatalf("expected error index path exists, got %v", err)
|
|
}
|
|
}
|
|
|
|
func TestIndexOpenNonExisting(t *testing.T) {
|
|
_, err := Open("doesnotexist")
|
|
if err != ErrorIndexPathDoesNotExist {
|
|
t.Fatalf("expected error index path does not exist, got %v", err)
|
|
}
|
|
}
|
|
|
|
func TestIndexOpenMetaMissingOrCorrupt(t *testing.T) {
|
|
tmpIndexPath := createTmpIndexPath(t)
|
|
defer cleanupTmpIndexPath(t, tmpIndexPath)
|
|
|
|
index, err := New(tmpIndexPath, NewIndexMapping())
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
err = index.Close()
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
tmpIndexPathMeta := filepath.Join(tmpIndexPath, "index_meta.json")
|
|
|
|
// now intentionally change the storage type
|
|
err = os.WriteFile(tmpIndexPathMeta, []byte(`{"storage":"mystery"}`), 0o666)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
_, err = Open(tmpIndexPath)
|
|
if err == nil {
|
|
t.Fatalf("expected error for unknown storage type, got %v", err)
|
|
}
|
|
|
|
// now intentionally corrupt the metadata
|
|
err = os.WriteFile(tmpIndexPathMeta, []byte("corrupted"), 0o666)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
_, err = Open(tmpIndexPath)
|
|
if err != ErrorIndexMetaCorrupt {
|
|
t.Fatalf("expected error index metadata corrupted, got %v", err)
|
|
}
|
|
|
|
// now intentionally remove the metadata
|
|
err = os.Remove(tmpIndexPathMeta)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
_, err = Open(tmpIndexPath)
|
|
if err != ErrorIndexMetaMissing {
|
|
t.Fatalf("expected error index metadata missing, got %v", err)
|
|
}
|
|
}
|
|
|
|
func TestInMemIndex(t *testing.T) {
|
|
index, err := NewMemOnly(NewIndexMapping())
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
err = index.Close()
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
}
|
|
|
|
func TestClosedIndex(t *testing.T) {
|
|
index, err := NewMemOnly(NewIndexMapping())
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
err = index.Close()
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
err = index.Index("test", "test")
|
|
if err != ErrorIndexClosed {
|
|
t.Errorf("expected error index closed, got %v", err)
|
|
}
|
|
|
|
err = index.Delete("test")
|
|
if err != ErrorIndexClosed {
|
|
t.Errorf("expected error index closed, got %v", err)
|
|
}
|
|
|
|
b := index.NewBatch()
|
|
err = index.Batch(b)
|
|
if err != ErrorIndexClosed {
|
|
t.Errorf("expected error index closed, got %v", err)
|
|
}
|
|
|
|
_, err = index.Document("test")
|
|
if err != ErrorIndexClosed {
|
|
t.Errorf("expected error index closed, got %v", err)
|
|
}
|
|
|
|
_, err = index.DocCount()
|
|
if err != ErrorIndexClosed {
|
|
t.Errorf("expected error index closed, got %v", err)
|
|
}
|
|
|
|
_, err = index.Search(NewSearchRequest(NewTermQuery("test")))
|
|
if err != ErrorIndexClosed {
|
|
t.Errorf("expected error index closed, got %v", err)
|
|
}
|
|
|
|
_, err = index.Fields()
|
|
if err != ErrorIndexClosed {
|
|
t.Errorf("expected error index closed, got %v", err)
|
|
}
|
|
}
|
|
|
|
type slowQuery struct {
|
|
actual query.Query
|
|
delay time.Duration
|
|
}
|
|
|
|
func (s *slowQuery) Searcher(ctx context.Context, i index.IndexReader, m mapping.IndexMapping, options search.SearcherOptions) (search.Searcher, error) {
|
|
time.Sleep(s.delay)
|
|
return s.actual.Searcher(ctx, i, m, options)
|
|
}
|
|
|
|
func TestSlowSearch(t *testing.T) {
|
|
tmpIndexPath := createTmpIndexPath(t)
|
|
defer cleanupTmpIndexPath(t, tmpIndexPath)
|
|
|
|
defer func() {
|
|
// reset logger back to normal
|
|
SetLog(log.New(io.Discard, "bleve", log.LstdFlags))
|
|
}()
|
|
// set custom logger
|
|
var sdw sawDataWriter
|
|
SetLog(log.New(&sdw, "bleve", log.LstdFlags))
|
|
|
|
index, err := New(tmpIndexPath, NewIndexMapping())
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
defer func() {
|
|
err := index.Close()
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
}()
|
|
|
|
Config.SlowSearchLogThreshold = 1 * time.Minute
|
|
|
|
query := NewTermQuery("water")
|
|
req := NewSearchRequest(query)
|
|
_, err = index.Search(req)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
if sdw.sawData {
|
|
t.Errorf("expected to not see slow query logged, but did")
|
|
}
|
|
|
|
sq := &slowQuery{
|
|
actual: query,
|
|
delay: 50 * time.Millisecond, // on Windows timer resolution is 15ms
|
|
}
|
|
req.Query = sq
|
|
Config.SlowSearchLogThreshold = 1 * time.Microsecond
|
|
_, err = index.Search(req)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
if !sdw.sawData {
|
|
t.Errorf("expected to see slow query logged, but didn't")
|
|
}
|
|
}
|
|
|
|
type sawDataWriter struct {
|
|
sawData bool
|
|
}
|
|
|
|
func (s *sawDataWriter) Write(p []byte) (n int, err error) {
|
|
s.sawData = true
|
|
return len(p), nil
|
|
}
|
|
|
|
func TestStoredFieldPreserved(t *testing.T) {
|
|
tmpIndexPath := createTmpIndexPath(t)
|
|
defer cleanupTmpIndexPath(t, tmpIndexPath)
|
|
|
|
index, err := New(tmpIndexPath, NewIndexMapping())
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
defer func() {
|
|
err := index.Close()
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
}()
|
|
|
|
doca := map[string]interface{}{
|
|
"name": "Marty",
|
|
"desc": "GopherCON India",
|
|
"bool": true,
|
|
"num": float64(1),
|
|
}
|
|
err = index.Index("a", doca)
|
|
if err != nil {
|
|
t.Error(err)
|
|
}
|
|
|
|
q := NewTermQuery("marty")
|
|
req := NewSearchRequest(q)
|
|
req.Fields = []string{"name", "desc", "bool", "num"}
|
|
res, err := index.Search(req)
|
|
if err != nil {
|
|
t.Error(err)
|
|
}
|
|
|
|
if len(res.Hits) != 1 {
|
|
t.Fatalf("expected 1 hit, got %d", len(res.Hits))
|
|
}
|
|
if res.Hits[0].Fields["name"] != "Marty" {
|
|
t.Errorf("expected 'Marty' got '%s'", res.Hits[0].Fields["name"])
|
|
}
|
|
if res.Hits[0].Fields["desc"] != "GopherCON India" {
|
|
t.Errorf("expected 'GopherCON India' got '%s'", res.Hits[0].Fields["desc"])
|
|
}
|
|
if res.Hits[0].Fields["num"] != float64(1) {
|
|
t.Errorf("expected '1' got '%v'", res.Hits[0].Fields["num"])
|
|
}
|
|
if res.Hits[0].Fields["bool"] != true {
|
|
t.Errorf("expected 'true' got '%v'", res.Hits[0].Fields["bool"])
|
|
}
|
|
}
|
|
|
|
func TestDict(t *testing.T) {
|
|
tmpIndexPath := createTmpIndexPath(t)
|
|
defer cleanupTmpIndexPath(t, tmpIndexPath)
|
|
|
|
index, err := New(tmpIndexPath, NewIndexMapping())
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
doca := map[string]interface{}{
|
|
"name": "marty",
|
|
"desc": "gophercon india",
|
|
}
|
|
err = index.Index("a", doca)
|
|
if err != nil {
|
|
t.Error(err)
|
|
}
|
|
|
|
docy := map[string]interface{}{
|
|
"name": "jasper",
|
|
"desc": "clojure",
|
|
}
|
|
err = index.Index("y", docy)
|
|
if err != nil {
|
|
t.Error(err)
|
|
}
|
|
|
|
docx := map[string]interface{}{
|
|
"name": "rose",
|
|
"desc": "googler",
|
|
}
|
|
err = index.Index("x", docx)
|
|
if err != nil {
|
|
t.Error(err)
|
|
}
|
|
|
|
dict, err := index.FieldDict("name")
|
|
if err != nil {
|
|
t.Error(err)
|
|
}
|
|
|
|
terms := []string{}
|
|
de, err := dict.Next()
|
|
for err == nil && de != nil {
|
|
terms = append(terms, string(de.Term))
|
|
de, err = dict.Next()
|
|
}
|
|
|
|
expectedTerms := []string{"jasper", "marty", "rose"}
|
|
if !reflect.DeepEqual(terms, expectedTerms) {
|
|
t.Errorf("expected %v, got %v", expectedTerms, terms)
|
|
}
|
|
|
|
err = dict.Close()
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
// test start and end range
|
|
dict, err = index.FieldDictRange("name", []byte("marty"), []byte("rose"))
|
|
if err != nil {
|
|
t.Error(err)
|
|
}
|
|
|
|
terms = []string{}
|
|
de, err = dict.Next()
|
|
for err == nil && de != nil {
|
|
terms = append(terms, string(de.Term))
|
|
de, err = dict.Next()
|
|
}
|
|
|
|
expectedTerms = []string{"marty", "rose"}
|
|
if !reflect.DeepEqual(terms, expectedTerms) {
|
|
t.Errorf("expected %v, got %v", expectedTerms, terms)
|
|
}
|
|
|
|
err = dict.Close()
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
docz := map[string]interface{}{
|
|
"name": "prefix",
|
|
"desc": "bob cat cats catting dog doggy zoo",
|
|
}
|
|
err = index.Index("z", docz)
|
|
if err != nil {
|
|
t.Error(err)
|
|
}
|
|
|
|
dict, err = index.FieldDictPrefix("desc", []byte("cat"))
|
|
if err != nil {
|
|
t.Error(err)
|
|
}
|
|
|
|
terms = []string{}
|
|
de, err = dict.Next()
|
|
for err == nil && de != nil {
|
|
terms = append(terms, string(de.Term))
|
|
de, err = dict.Next()
|
|
}
|
|
|
|
expectedTerms = []string{"cat", "cats", "catting"}
|
|
if !reflect.DeepEqual(terms, expectedTerms) {
|
|
t.Errorf("expected %v, got %v", expectedTerms, terms)
|
|
}
|
|
|
|
stats := index.Stats()
|
|
if stats == nil {
|
|
t.Errorf("expected IndexStat, got nil")
|
|
}
|
|
|
|
err = dict.Close()
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
err = index.Close()
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
}
|
|
|
|
func TestBatchString(t *testing.T) {
|
|
tmpIndexPath := createTmpIndexPath(t)
|
|
defer cleanupTmpIndexPath(t, tmpIndexPath)
|
|
|
|
index, err := New(tmpIndexPath, NewIndexMapping())
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
defer func() {
|
|
err := index.Close()
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
}()
|
|
|
|
batch := index.NewBatch()
|
|
err = batch.Index("a", []byte("{}"))
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
batch.Delete("b")
|
|
batch.SetInternal([]byte("c"), []byte{})
|
|
batch.DeleteInternal([]byte("d"))
|
|
|
|
batchStr := batch.String()
|
|
if !strings.HasPrefix(batchStr, "Batch (2 ops, 2 internal ops)") {
|
|
t.Errorf("expected to start with Batch (2 ops, 2 internal ops), did not")
|
|
}
|
|
if !strings.Contains(batchStr, "INDEX - 'a'") {
|
|
t.Errorf("expected to contain INDEX - 'a', did not")
|
|
}
|
|
if !strings.Contains(batchStr, "DELETE - 'b'") {
|
|
t.Errorf("expected to contain DELETE - 'b', did not")
|
|
}
|
|
if !strings.Contains(batchStr, "SET INTERNAL - 'c'") {
|
|
t.Errorf("expected to contain SET INTERNAL - 'c', did not")
|
|
}
|
|
if !strings.Contains(batchStr, "DELETE INTERNAL - 'd'") {
|
|
t.Errorf("expected to contain DELETE INTERNAL - 'd', did not")
|
|
}
|
|
}
|
|
|
|
func TestIndexMetadataRaceBug198(t *testing.T) {
|
|
tmpIndexPath := createTmpIndexPath(t)
|
|
defer cleanupTmpIndexPath(t, tmpIndexPath)
|
|
|
|
index, err := New(tmpIndexPath, NewIndexMapping())
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
defer func() {
|
|
err := index.Close()
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
}()
|
|
|
|
wg := sync.WaitGroup{}
|
|
wg.Add(1)
|
|
done := make(chan struct{})
|
|
go func() {
|
|
for {
|
|
select {
|
|
case <-done:
|
|
wg.Done()
|
|
return
|
|
default:
|
|
_, err2 := index.DocCount()
|
|
if err2 != nil {
|
|
t.Error(err2)
|
|
wg.Done()
|
|
return
|
|
}
|
|
}
|
|
}
|
|
}()
|
|
|
|
for i := 0; i < 100; i++ {
|
|
batch := index.NewBatch()
|
|
err = batch.Index("a", []byte("{}"))
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
err = index.Batch(batch)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
}
|
|
|
|
close(done)
|
|
wg.Wait()
|
|
}
|
|
|
|
func TestSortMatchSearch(t *testing.T) {
|
|
tmpIndexPath := createTmpIndexPath(t)
|
|
defer cleanupTmpIndexPath(t, tmpIndexPath)
|
|
|
|
index, err := New(tmpIndexPath, NewIndexMapping())
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
names := []string{"Noam", "Uri", "David", "Yosef", "Eitan", "Itay", "Ariel", "Daniel", "Omer", "Yogev", "Yehonatan", "Moshe", "Mohammed", "Yusuf", "Omar"}
|
|
days := []string{"Sunday", "Monday", "Tuesday", "Wednesday", "Thursday", "Friday", "Saturday"}
|
|
numbers := []string{"One", "Two", "Three", "Four", "Five", "Six", "Seven", "Eight", "Nine", "Ten", "Eleven", "Twelve"}
|
|
b := index.NewBatch()
|
|
for i := 0; i < 200; i++ {
|
|
doc := make(map[string]interface{})
|
|
doc["Name"] = names[i%len(names)]
|
|
doc["Day"] = days[i%len(days)]
|
|
doc["Number"] = numbers[i%len(numbers)]
|
|
err = b.Index(fmt.Sprintf("%d", i), doc)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
}
|
|
err = index.Batch(b)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
req := NewSearchRequest(NewMatchQuery("One"))
|
|
req.SortBy([]string{"Day", "Name"})
|
|
req.Fields = []string{"*"}
|
|
sr, err := index.Search(req)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
prev := ""
|
|
for _, hit := range sr.Hits {
|
|
val := hit.Fields["Day"].(string)
|
|
if prev > val {
|
|
t.Errorf("Hits must be sorted by 'Day'. Found '%s' before '%s'", prev, val)
|
|
}
|
|
prev = val
|
|
}
|
|
err = index.Close()
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
}
|
|
|
|
func TestIndexCountMatchSearch(t *testing.T) {
|
|
tmpIndexPath := createTmpIndexPath(t)
|
|
defer cleanupTmpIndexPath(t, tmpIndexPath)
|
|
|
|
index, err := New(tmpIndexPath, NewIndexMapping())
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
var wg sync.WaitGroup
|
|
for i := 0; i < 10; i++ {
|
|
wg.Add(1)
|
|
go func(i int) {
|
|
b := index.NewBatch()
|
|
for j := 0; j < 200; j++ {
|
|
id := fmt.Sprintf("%d", (i*200)+j)
|
|
|
|
doc := struct {
|
|
Body string
|
|
}{
|
|
Body: "match",
|
|
}
|
|
|
|
err := b.Index(id, doc)
|
|
if err != nil {
|
|
t.Error(err)
|
|
wg.Done()
|
|
return
|
|
}
|
|
}
|
|
|
|
err := index.Batch(b)
|
|
if err != nil {
|
|
t.Error(err)
|
|
wg.Done()
|
|
return
|
|
}
|
|
|
|
wg.Done()
|
|
}(i)
|
|
}
|
|
wg.Wait()
|
|
|
|
// search for something that should match all documents
|
|
sr, err := index.Search(NewSearchRequest(NewMatchQuery("match")))
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
// get the index document count
|
|
dc, err := index.DocCount()
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
// make sure test is working correctly, doc count should 2000
|
|
if dc != 2000 {
|
|
t.Errorf("expected doc count 2000, got %d", dc)
|
|
}
|
|
|
|
// make sure our search found all the documents
|
|
if dc != sr.Total {
|
|
t.Errorf("expected search result total %d to match doc count %d", sr.Total, dc)
|
|
}
|
|
|
|
err = index.Close()
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
}
|
|
|
|
func TestBatchReset(t *testing.T) {
|
|
tmpIndexPath := createTmpIndexPath(t)
|
|
defer cleanupTmpIndexPath(t, tmpIndexPath)
|
|
|
|
index, err := New(tmpIndexPath, NewIndexMapping())
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
batch := index.NewBatch()
|
|
err = batch.Index("k1", struct {
|
|
Body string
|
|
}{
|
|
Body: "v1",
|
|
})
|
|
if err != nil {
|
|
t.Error(err)
|
|
}
|
|
batch.Delete("k2")
|
|
batch.SetInternal([]byte("k3"), []byte("v3"))
|
|
batch.DeleteInternal([]byte("k4"))
|
|
|
|
if batch.Size() != 4 {
|
|
t.Logf("%v", batch)
|
|
t.Errorf("expected batch size 4, got %d", batch.Size())
|
|
}
|
|
|
|
batch.Reset()
|
|
|
|
if batch.Size() != 0 {
|
|
t.Errorf("expected batch size 0 after reset, got %d", batch.Size())
|
|
}
|
|
|
|
err = index.Close()
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
}
|
|
|
|
func TestDocumentFieldArrayPositions(t *testing.T) {
|
|
tmpIndexPath := createTmpIndexPath(t)
|
|
defer cleanupTmpIndexPath(t, tmpIndexPath)
|
|
|
|
idx, err := New(tmpIndexPath, NewIndexMapping())
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
// index a document with an array of strings
|
|
err = idx.Index("k", struct {
|
|
Messages []string
|
|
}{
|
|
Messages: []string{
|
|
"first",
|
|
"second",
|
|
"third",
|
|
"last",
|
|
},
|
|
})
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
// load the document
|
|
doc, err := idx.Document("k")
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
doc.VisitFields(func(f index.Field) {
|
|
if reflect.DeepEqual(f.Value(), []byte("first")) {
|
|
ap := f.ArrayPositions()
|
|
if len(ap) < 1 {
|
|
t.Errorf("expected an array position, got none")
|
|
return
|
|
}
|
|
if ap[0] != 0 {
|
|
t.Errorf("expected 'first' in array position 0, got %d", ap[0])
|
|
}
|
|
}
|
|
if reflect.DeepEqual(f.Value(), []byte("second")) {
|
|
ap := f.ArrayPositions()
|
|
if len(ap) < 1 {
|
|
t.Errorf("expected an array position, got none")
|
|
return
|
|
}
|
|
if ap[0] != 1 {
|
|
t.Errorf("expected 'second' in array position 1, got %d", ap[0])
|
|
}
|
|
}
|
|
if reflect.DeepEqual(f.Value(), []byte("third")) {
|
|
ap := f.ArrayPositions()
|
|
if len(ap) < 1 {
|
|
t.Errorf("expected an array position, got none")
|
|
return
|
|
}
|
|
if ap[0] != 2 {
|
|
t.Errorf("expected 'third' in array position 2, got %d", ap[0])
|
|
}
|
|
}
|
|
if reflect.DeepEqual(f.Value(), []byte("last")) {
|
|
ap := f.ArrayPositions()
|
|
if len(ap) < 1 {
|
|
t.Errorf("expected an array position, got none")
|
|
return
|
|
}
|
|
if ap[0] != 3 {
|
|
t.Errorf("expected 'last' in array position 3, got %d", ap[0])
|
|
}
|
|
}
|
|
})
|
|
|
|
// now index a document in the same field with a single string
|
|
err = idx.Index("k2", struct {
|
|
Messages string
|
|
}{
|
|
Messages: "only",
|
|
})
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
// load the document
|
|
doc, err = idx.Document("k2")
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
doc.VisitFields(func(f index.Field) {
|
|
if reflect.DeepEqual(f.Value(), []byte("only")) {
|
|
ap := f.ArrayPositions()
|
|
if len(ap) != 0 {
|
|
t.Errorf("expected no array positions, got %d", len(ap))
|
|
return
|
|
}
|
|
}
|
|
})
|
|
|
|
err = idx.Close()
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
}
|
|
|
|
func TestKeywordSearchBug207(t *testing.T) {
|
|
tmpIndexPath := createTmpIndexPath(t)
|
|
defer cleanupTmpIndexPath(t, tmpIndexPath)
|
|
|
|
f := NewTextFieldMapping()
|
|
f.Analyzer = keyword.Name
|
|
|
|
m := NewIndexMapping()
|
|
m.DefaultMapping = NewDocumentMapping()
|
|
m.DefaultMapping.AddFieldMappingsAt("Body", f)
|
|
|
|
index, err := New(tmpIndexPath, m)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
doc1 := struct {
|
|
Body string
|
|
}{
|
|
Body: "a555c3bb06f7a127cda000005",
|
|
}
|
|
|
|
err = index.Index("a", doc1)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
doc2 := struct {
|
|
Body string
|
|
}{
|
|
Body: "555c3bb06f7a127cda000005",
|
|
}
|
|
|
|
err = index.Index("b", doc2)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
// now search for these terms
|
|
sreq := NewSearchRequest(NewTermQuery("a555c3bb06f7a127cda000005"))
|
|
sres, err := index.Search(sreq)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
if sres.Total != 1 {
|
|
t.Errorf("expected 1 result, got %d", sres.Total)
|
|
}
|
|
if sres.Hits[0].ID != "a" {
|
|
t.Errorf("expecated id 'a', got '%s'", sres.Hits[0].ID)
|
|
}
|
|
|
|
sreq = NewSearchRequest(NewTermQuery("555c3bb06f7a127cda000005"))
|
|
sres, err = index.Search(sreq)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
if sres.Total != 1 {
|
|
t.Errorf("expected 1 result, got %d", sres.Total)
|
|
}
|
|
if sres.Hits[0].ID != "b" {
|
|
t.Errorf("expecated id 'b', got '%s'", sres.Hits[0].ID)
|
|
}
|
|
|
|
// now do the same searches using query strings
|
|
sreq = NewSearchRequest(NewQueryStringQuery("Body:a555c3bb06f7a127cda000005"))
|
|
sres, err = index.Search(sreq)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
if sres.Total != 1 {
|
|
t.Errorf("expected 1 result, got %d", sres.Total)
|
|
}
|
|
if sres.Hits[0].ID != "a" {
|
|
t.Errorf("expecated id 'a', got '%s'", sres.Hits[0].ID)
|
|
}
|
|
|
|
sreq = NewSearchRequest(NewQueryStringQuery(`Body:555c3bb06f7a127cda000005`))
|
|
sres, err = index.Search(sreq)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
if sres.Total != 1 {
|
|
t.Errorf("expected 1 result, got %d", sres.Total)
|
|
}
|
|
if sres.Hits[0].ID != "b" {
|
|
t.Errorf("expecated id 'b', got '%s'", sres.Hits[0].ID)
|
|
}
|
|
|
|
err = index.Close()
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
}
|
|
|
|
func TestTermVectorArrayPositions(t *testing.T) {
|
|
tmpIndexPath := createTmpIndexPath(t)
|
|
defer cleanupTmpIndexPath(t, tmpIndexPath)
|
|
|
|
index, err := New(tmpIndexPath, NewIndexMapping())
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
// index a document with an array of strings
|
|
err = index.Index("k", struct {
|
|
Messages []string
|
|
}{
|
|
Messages: []string{
|
|
"first",
|
|
"second",
|
|
"third",
|
|
"last",
|
|
},
|
|
})
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
// search for this document in all field
|
|
tq := NewTermQuery("second")
|
|
tsr := NewSearchRequest(tq)
|
|
tsr.IncludeLocations = true
|
|
results, err := index.Search(tsr)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
if results.Total != 1 {
|
|
t.Fatalf("expected 1 result, got %d", results.Total)
|
|
}
|
|
if len(results.Hits[0].Locations["Messages"]["second"]) < 1 {
|
|
t.Fatalf("expected at least one location")
|
|
}
|
|
if len(results.Hits[0].Locations["Messages"]["second"][0].ArrayPositions) < 1 {
|
|
t.Fatalf("expected at least one location array position")
|
|
}
|
|
if results.Hits[0].Locations["Messages"]["second"][0].ArrayPositions[0] != 1 {
|
|
t.Fatalf("expected array position 1, got %d", results.Hits[0].Locations["Messages"]["second"][0].ArrayPositions[0])
|
|
}
|
|
|
|
// repeat search for this document in Messages field
|
|
tq2 := NewTermQuery("third")
|
|
tq2.SetField("Messages")
|
|
tsr = NewSearchRequest(tq2)
|
|
tsr.IncludeLocations = true
|
|
results, err = index.Search(tsr)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
if results.Total != 1 {
|
|
t.Fatalf("expected 1 result, got %d", results.Total)
|
|
}
|
|
if len(results.Hits[0].Locations["Messages"]["third"]) < 1 {
|
|
t.Fatalf("expected at least one location")
|
|
}
|
|
if len(results.Hits[0].Locations["Messages"]["third"][0].ArrayPositions) < 1 {
|
|
t.Fatalf("expected at least one location array position")
|
|
}
|
|
if results.Hits[0].Locations["Messages"]["third"][0].ArrayPositions[0] != 2 {
|
|
t.Fatalf("expected array position 2, got %d", results.Hits[0].Locations["Messages"]["third"][0].ArrayPositions[0])
|
|
}
|
|
|
|
err = index.Close()
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
}
|
|
|
|
func TestDocumentStaticMapping(t *testing.T) {
|
|
tmpIndexPath := createTmpIndexPath(t)
|
|
defer cleanupTmpIndexPath(t, tmpIndexPath)
|
|
|
|
m := NewIndexMapping()
|
|
m.DefaultMapping = NewDocumentStaticMapping()
|
|
m.DefaultMapping.AddFieldMappingsAt("Text", NewTextFieldMapping())
|
|
m.DefaultMapping.AddFieldMappingsAt("Date", NewDateTimeFieldMapping())
|
|
m.DefaultMapping.AddFieldMappingsAt("Numeric", NewNumericFieldMapping())
|
|
|
|
index, err := New(tmpIndexPath, m)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
doc1 := struct {
|
|
Text string
|
|
IgnoredText string
|
|
Numeric float64
|
|
IgnoredNumeric float64
|
|
Date time.Time
|
|
IgnoredDate time.Time
|
|
}{
|
|
Text: "valid text",
|
|
IgnoredText: "ignored text",
|
|
Numeric: 10,
|
|
IgnoredNumeric: 20,
|
|
Date: time.Unix(1, 0),
|
|
IgnoredDate: time.Unix(2, 0),
|
|
}
|
|
|
|
err = index.Index("a", doc1)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
fields, err := index.Fields()
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
sort.Strings(fields)
|
|
expectedFields := []string{"Date", "Numeric", "Text", "_all"}
|
|
if len(fields) < len(expectedFields) {
|
|
t.Fatalf("invalid field count: %d", len(fields))
|
|
}
|
|
for i, expected := range expectedFields {
|
|
if expected != fields[i] {
|
|
t.Fatalf("unexpected field[%d]: %s", i, fields[i])
|
|
}
|
|
}
|
|
|
|
err = index.Close()
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
}
|
|
|
|
func TestIndexEmptyDocId(t *testing.T) {
|
|
tmpIndexPath := createTmpIndexPath(t)
|
|
defer cleanupTmpIndexPath(t, tmpIndexPath)
|
|
|
|
index, err := New(tmpIndexPath, NewIndexMapping())
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
defer func() {
|
|
err := index.Close()
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
}()
|
|
|
|
doc := map[string]interface{}{
|
|
"body": "nodocid",
|
|
}
|
|
|
|
err = index.Index("", doc)
|
|
if err != ErrorEmptyID {
|
|
t.Errorf("expect index empty doc id to fail")
|
|
}
|
|
|
|
err = index.Delete("")
|
|
if err != ErrorEmptyID {
|
|
t.Errorf("expect delete empty doc id to fail")
|
|
}
|
|
|
|
batch := index.NewBatch()
|
|
err = batch.Index("", doc)
|
|
if err != ErrorEmptyID {
|
|
t.Errorf("expect index empty doc id in batch to fail")
|
|
}
|
|
|
|
batch.Delete("")
|
|
if batch.Size() > 0 {
|
|
t.Errorf("expect delete empty doc id in batch to be ignored")
|
|
}
|
|
}
|
|
|
|
func TestDateTimeFieldMappingIssue287(t *testing.T) {
|
|
tmpIndexPath := createTmpIndexPath(t)
|
|
defer cleanupTmpIndexPath(t, tmpIndexPath)
|
|
|
|
f := NewDateTimeFieldMapping()
|
|
|
|
m := NewIndexMapping()
|
|
m.DefaultMapping = NewDocumentMapping()
|
|
m.DefaultMapping.AddFieldMappingsAt("Date", f)
|
|
|
|
index, err := New(tmpIndexPath, m)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
type doc struct {
|
|
Date time.Time
|
|
}
|
|
|
|
now := time.Now()
|
|
|
|
// 3hr ago to 1hr ago
|
|
for i := 0; i < 3; i++ {
|
|
d := doc{now.Add(time.Duration((i - 3)) * time.Hour)}
|
|
|
|
err = index.Index(strconv.FormatInt(int64(i), 10), d)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
}
|
|
|
|
// search range across all docs
|
|
start := now.Add(-4 * time.Hour)
|
|
end := now
|
|
sreq := NewSearchRequest(NewDateRangeQuery(start, end))
|
|
sres, err := index.Search(sreq)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
if sres.Total != 3 {
|
|
t.Errorf("expected 3 results, got %d", sres.Total)
|
|
}
|
|
|
|
// search range includes only oldest
|
|
start = now.Add(-4 * time.Hour)
|
|
end = now.Add(-121 * time.Minute)
|
|
sreq = NewSearchRequest(NewDateRangeQuery(start, end))
|
|
sres, err = index.Search(sreq)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
if sres.Total != 1 {
|
|
t.Errorf("expected 1 results, got %d", sres.Total)
|
|
}
|
|
if sres.Total > 0 && sres.Hits[0].ID != "0" {
|
|
t.Errorf("expecated id '0', got '%s'", sres.Hits[0].ID)
|
|
}
|
|
|
|
// search range includes only newest
|
|
start = now.Add(-61 * time.Minute)
|
|
end = now
|
|
sreq = NewSearchRequest(NewDateRangeQuery(start, end))
|
|
sres, err = index.Search(sreq)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
if sres.Total != 1 {
|
|
t.Errorf("expected 1 results, got %d", sres.Total)
|
|
}
|
|
if sres.Total > 0 && sres.Hits[0].ID != "2" {
|
|
t.Errorf("expecated id '2', got '%s'", sres.Hits[0].ID)
|
|
}
|
|
|
|
err = index.Close()
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
}
|
|
|
|
func TestDocumentFieldArrayPositionsBug295(t *testing.T) {
|
|
tmpIndexPath := createTmpIndexPath(t)
|
|
defer cleanupTmpIndexPath(t, tmpIndexPath)
|
|
|
|
index, err := New(tmpIndexPath, NewIndexMapping())
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
// index a document with an array of strings
|
|
err = index.Index("k", struct {
|
|
Messages []string
|
|
Another string
|
|
MoreData []string
|
|
}{
|
|
Messages: []string{
|
|
"bleve",
|
|
"bleve",
|
|
},
|
|
Another: "text",
|
|
MoreData: []string{
|
|
"a",
|
|
"b",
|
|
"c",
|
|
"bleve",
|
|
},
|
|
})
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
// search for it in the messages field
|
|
tq := NewTermQuery("bleve")
|
|
tq.SetField("Messages")
|
|
tsr := NewSearchRequest(tq)
|
|
tsr.IncludeLocations = true
|
|
results, err := index.Search(tsr)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
if results.Total != 1 {
|
|
t.Fatalf("expected 1 result, got %d", results.Total)
|
|
}
|
|
if len(results.Hits[0].Locations["Messages"]["bleve"]) != 2 {
|
|
t.Fatalf("expected 2 locations of 'bleve', got %d", len(results.Hits[0].Locations["Messages"]["bleve"]))
|
|
}
|
|
if results.Hits[0].Locations["Messages"]["bleve"][0].ArrayPositions[0] != 0 {
|
|
t.Errorf("expected array position to be 0")
|
|
}
|
|
if results.Hits[0].Locations["Messages"]["bleve"][1].ArrayPositions[0] != 1 {
|
|
t.Errorf("expected array position to be 1")
|
|
}
|
|
|
|
// search for it in all
|
|
tq = NewTermQuery("bleve")
|
|
tsr = NewSearchRequest(tq)
|
|
tsr.IncludeLocations = true
|
|
results, err = index.Search(tsr)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
if results.Total != 1 {
|
|
t.Fatalf("expected 1 result, got %d", results.Total)
|
|
}
|
|
if len(results.Hits[0].Locations["Messages"]["bleve"]) != 2 {
|
|
t.Fatalf("expected 2 locations of 'bleve', got %d", len(results.Hits[0].Locations["Messages"]["bleve"]))
|
|
}
|
|
if results.Hits[0].Locations["Messages"]["bleve"][0].ArrayPositions[0] != 0 {
|
|
t.Errorf("expected array position to be 0")
|
|
}
|
|
if results.Hits[0].Locations["Messages"]["bleve"][1].ArrayPositions[0] != 1 {
|
|
t.Errorf("expected array position to be 1")
|
|
}
|
|
|
|
err = index.Close()
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
}
|
|
|
|
func TestBooleanFieldMappingIssue109(t *testing.T) {
|
|
tmpIndexPath := createTmpIndexPath(t)
|
|
defer cleanupTmpIndexPath(t, tmpIndexPath)
|
|
|
|
m := NewIndexMapping()
|
|
m.DefaultMapping = NewDocumentMapping()
|
|
m.DefaultMapping.AddFieldMappingsAt("Bool", NewBooleanFieldMapping())
|
|
|
|
index, err := New(tmpIndexPath, m)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
type doc struct {
|
|
Bool bool
|
|
}
|
|
err = index.Index("true", &doc{Bool: true})
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
err = index.Index("false", &doc{Bool: false})
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
q := NewBoolFieldQuery(true)
|
|
q.SetField("Bool")
|
|
sreq := NewSearchRequest(q)
|
|
sres, err := index.Search(sreq)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
if sres.Total != 1 {
|
|
t.Errorf("expected 1 results, got %d", sres.Total)
|
|
}
|
|
|
|
q = NewBoolFieldQuery(false)
|
|
q.SetField("Bool")
|
|
sreq = NewSearchRequest(q)
|
|
sres, err = index.Search(sreq)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
if sres.Total != 1 {
|
|
t.Errorf("expected 1 results, got %d", sres.Total)
|
|
}
|
|
|
|
sreq = NewSearchRequest(NewBoolFieldQuery(true))
|
|
sres, err = index.Search(sreq)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
if sres.Total != 1 {
|
|
t.Errorf("expected 1 results, got %d", sres.Total)
|
|
}
|
|
|
|
err = index.Close()
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
}
|
|
|
|
func TestSearchTimeout(t *testing.T) {
|
|
tmpIndexPath := createTmpIndexPath(t)
|
|
defer cleanupTmpIndexPath(t, tmpIndexPath)
|
|
|
|
index, err := New(tmpIndexPath, NewIndexMapping())
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
defer func() {
|
|
err := index.Close()
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
}()
|
|
|
|
// first run a search with an absurdly long timeout (should succeed)
|
|
ctx, cancel := context.WithTimeout(context.Background(), 10*time.Second)
|
|
defer cancel()
|
|
query := NewTermQuery("water")
|
|
req := NewSearchRequest(query)
|
|
_, err = index.SearchInContext(ctx, req)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
// now run a search again with an absurdly low timeout (should timeout)
|
|
ctx, cancel = context.WithTimeout(context.Background(), 1*time.Microsecond)
|
|
defer cancel()
|
|
sq := &slowQuery{
|
|
actual: query,
|
|
delay: 50 * time.Millisecond, // on Windows timer resolution is 15ms
|
|
}
|
|
req.Query = sq
|
|
_, err = index.SearchInContext(ctx, req)
|
|
if err != context.DeadlineExceeded {
|
|
t.Fatalf("exected %v, got: %v", context.DeadlineExceeded, err)
|
|
}
|
|
|
|
// now run a search with a long timeout, but with a long query, and cancel it
|
|
ctx, cancel = context.WithTimeout(context.Background(), 10*time.Second)
|
|
sq = &slowQuery{
|
|
actual: query,
|
|
delay: 100 * time.Millisecond, // on Windows timer resolution is 15ms
|
|
}
|
|
req = NewSearchRequest(sq)
|
|
cancel()
|
|
_, err = index.SearchInContext(ctx, req)
|
|
if err != context.Canceled {
|
|
t.Fatalf("exected %v, got: %v", context.Canceled, err)
|
|
}
|
|
}
|
|
|
|
// TestConfigCache exposes a concurrent map write with go 1.6
|
|
func TestConfigCache(t *testing.T) {
|
|
for i := 0; i < 100; i++ {
|
|
go func() {
|
|
_, err := Config.Cache.HighlighterNamed(Config.DefaultHighlighter)
|
|
if err != nil {
|
|
t.Error(err)
|
|
}
|
|
}()
|
|
}
|
|
}
|
|
|
|
func TestBatchRaceBug260(t *testing.T) {
|
|
tmpIndexPath := createTmpIndexPath(t)
|
|
defer cleanupTmpIndexPath(t, tmpIndexPath)
|
|
i, err := New(tmpIndexPath, NewIndexMapping())
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
defer func() {
|
|
err := i.Close()
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
}()
|
|
b := i.NewBatch()
|
|
err = b.Index("1", 1)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
err = i.Batch(b)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
b.Reset()
|
|
err = b.Index("2", 2)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
err = i.Batch(b)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
b.Reset()
|
|
}
|
|
|
|
func BenchmarkBatchOverhead(b *testing.B) {
|
|
tmpIndexPath := createTmpIndexPath(b)
|
|
defer cleanupTmpIndexPath(b, tmpIndexPath)
|
|
m := NewIndexMapping()
|
|
i, err := NewUsing(tmpIndexPath, m, Config.DefaultIndexType, null.Name, nil)
|
|
if err != nil {
|
|
b.Fatal(err)
|
|
}
|
|
for n := 0; n < b.N; n++ {
|
|
// put 1000 items in a batch
|
|
batch := i.NewBatch()
|
|
for i := 0; i < 1000; i++ {
|
|
err = batch.Index(fmt.Sprintf("%d", i), map[string]interface{}{"name": "bleve"})
|
|
if err != nil {
|
|
b.Fatal(err)
|
|
}
|
|
}
|
|
err = i.Batch(batch)
|
|
if err != nil {
|
|
b.Fatal(err)
|
|
}
|
|
batch.Reset()
|
|
}
|
|
}
|
|
|
|
func TestOpenReadonlyMultiple(t *testing.T) {
|
|
tmpIndexPath := createTmpIndexPath(t)
|
|
defer cleanupTmpIndexPath(t, tmpIndexPath)
|
|
|
|
// build an index and close it
|
|
index, err := New(tmpIndexPath, NewIndexMapping())
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
doca := map[string]interface{}{
|
|
"name": "marty",
|
|
"desc": "gophercon india",
|
|
}
|
|
err = index.Index("a", doca)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
err = index.Close()
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
// now open it read-only
|
|
index, err = OpenUsing(tmpIndexPath, map[string]interface{}{
|
|
"read_only": true,
|
|
})
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
// now open it again
|
|
index2, err := OpenUsing(tmpIndexPath, map[string]interface{}{
|
|
"read_only": true,
|
|
})
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
err = index.Close()
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
err = index2.Close()
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
}
|
|
|
|
// TestBug408 tests for VERY large values of size, even though actual result
|
|
// set may be reasonable size
|
|
func TestBug408(t *testing.T) {
|
|
type TestStruct struct {
|
|
ID string `json:"id"`
|
|
UserID *string `json:"user_id"`
|
|
}
|
|
|
|
docMapping := NewDocumentMapping()
|
|
docMapping.AddFieldMappingsAt("id", NewTextFieldMapping())
|
|
docMapping.AddFieldMappingsAt("user_id", NewTextFieldMapping())
|
|
|
|
indexMapping := NewIndexMapping()
|
|
indexMapping.DefaultMapping = docMapping
|
|
|
|
index, err := NewMemOnly(indexMapping)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
numToTest := 10
|
|
matchUserID := "match"
|
|
noMatchUserID := "no_match"
|
|
matchingDocIds := make(map[string]struct{})
|
|
|
|
for i := 0; i < numToTest; i++ {
|
|
ds := &TestStruct{"id_" + strconv.Itoa(i), nil}
|
|
if i%2 == 0 {
|
|
ds.UserID = &noMatchUserID
|
|
} else {
|
|
ds.UserID = &matchUserID
|
|
matchingDocIds[ds.ID] = struct{}{}
|
|
}
|
|
err = index.Index(ds.ID, ds)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
}
|
|
|
|
cnt, err := index.DocCount()
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
if int(cnt) != numToTest {
|
|
t.Fatalf("expected %d documents in index, got %d", numToTest, cnt)
|
|
}
|
|
|
|
q := NewTermQuery(matchUserID)
|
|
q.SetField("user_id")
|
|
searchReq := NewSearchRequestOptions(q, math.MaxInt32, 0, false)
|
|
results, err := index.Search(searchReq)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
if int(results.Total) != numToTest/2 {
|
|
t.Fatalf("expected %d search hits, got %d", numToTest/2, results.Total)
|
|
}
|
|
|
|
for _, result := range results.Hits {
|
|
if _, found := matchingDocIds[result.ID]; !found {
|
|
t.Fatalf("document with ID %s not in results as expected", result.ID)
|
|
}
|
|
}
|
|
}
|
|
|
|
func TestIndexAdvancedCountMatchSearch(t *testing.T) {
|
|
tmpIndexPath := createTmpIndexPath(t)
|
|
defer cleanupTmpIndexPath(t, tmpIndexPath)
|
|
|
|
index, err := New(tmpIndexPath, NewIndexMapping())
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
var wg sync.WaitGroup
|
|
errChan := make(chan error, 10)
|
|
for i := 0; i < 10; i++ {
|
|
wg.Add(1)
|
|
go func(i int) {
|
|
defer wg.Done()
|
|
b := index.NewBatch()
|
|
for j := 0; j < 200; j++ {
|
|
id := fmt.Sprintf("%d", (i*200)+j)
|
|
|
|
doc := document.NewDocument(id)
|
|
doc.AddField(document.NewTextField("body", []uint64{}, []byte("match")))
|
|
doc.AddField(document.NewCompositeField("_all", true, []string{}, []string{}))
|
|
|
|
err := b.IndexAdvanced(doc)
|
|
if err != nil {
|
|
errChan <- err
|
|
return
|
|
}
|
|
}
|
|
err := index.Batch(b)
|
|
if err != nil {
|
|
errChan <- err
|
|
return
|
|
}
|
|
}(i)
|
|
}
|
|
wg.Wait()
|
|
|
|
close(errChan)
|
|
for err := range errChan {
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
}
|
|
|
|
// search for something that should match all documents
|
|
sr, err := index.Search(NewSearchRequest(NewMatchQuery("match")))
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
// get the index document count
|
|
dc, err := index.DocCount()
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
// make sure test is working correctly, doc count should 2000
|
|
if dc != 2000 {
|
|
t.Errorf("expected doc count 2000, got %d", dc)
|
|
}
|
|
|
|
// make sure our search found all the documents
|
|
if dc != sr.Total {
|
|
t.Errorf("expected search result total %d to match doc count %d", sr.Total, dc)
|
|
}
|
|
|
|
err = index.Close()
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
}
|
|
|
|
func benchmarkSearchOverhead(indexType string, b *testing.B) {
|
|
tmpIndexPath := createTmpIndexPath(b)
|
|
defer cleanupTmpIndexPath(b, tmpIndexPath)
|
|
|
|
index, err := NewUsing(tmpIndexPath, NewIndexMapping(),
|
|
indexType, Config.DefaultKVStore, nil)
|
|
if err != nil {
|
|
b.Fatal(err)
|
|
}
|
|
defer func() {
|
|
err := index.Close()
|
|
if err != nil {
|
|
b.Fatal(err)
|
|
}
|
|
}()
|
|
|
|
elements := []string{"air", "water", "fire", "earth"}
|
|
for j := 0; j < 10000; j++ {
|
|
err = index.Index(fmt.Sprintf("%d", j),
|
|
map[string]interface{}{"name": elements[j%len(elements)]})
|
|
if err != nil {
|
|
b.Fatal(err)
|
|
}
|
|
}
|
|
|
|
query1 := NewTermQuery("water")
|
|
query2 := NewTermQuery("fire")
|
|
query := NewDisjunctionQuery(query1, query2)
|
|
req := NewSearchRequest(query)
|
|
|
|
b.ResetTimer()
|
|
|
|
for n := 0; n < b.N; n++ {
|
|
_, err = index.Search(req)
|
|
if err != nil {
|
|
b.Fatal(err)
|
|
}
|
|
}
|
|
}
|
|
|
|
func BenchmarkUpsidedownSearchOverhead(b *testing.B) {
|
|
benchmarkSearchOverhead(upsidedown.Name, b)
|
|
}
|
|
|
|
func BenchmarkScorchSearchOverhead(b *testing.B) {
|
|
benchmarkSearchOverhead(scorch.Name, b)
|
|
}
|
|
|
|
func TestSearchQueryCallback(t *testing.T) {
|
|
tmpIndexPath := createTmpIndexPath(t)
|
|
defer cleanupTmpIndexPath(t, tmpIndexPath)
|
|
|
|
index, err := New(tmpIndexPath, NewIndexMapping())
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
defer func() {
|
|
err := index.Close()
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
}()
|
|
|
|
query := NewTermQuery("water")
|
|
req := NewSearchRequest(query)
|
|
|
|
expErr := fmt.Errorf("MEM_LIMIT_EXCEEDED")
|
|
f := func(size uint64) error {
|
|
// the intended usage of this callback is to see the estimated
|
|
// memory usage before executing, and possibly abort early
|
|
// in this test we simulate returning such an error
|
|
return expErr
|
|
}
|
|
|
|
ctx := context.WithValue(context.Background(), SearchQueryStartCallbackKey, SearchQueryStartCallbackFn(f))
|
|
_, err = index.SearchInContext(ctx, req)
|
|
if err != expErr {
|
|
t.Fatalf("Expected: %v, Got: %v", expErr, err)
|
|
}
|
|
}
|
|
|
|
func TestBatchMerge(t *testing.T) {
|
|
tmpIndexPath := createTmpIndexPath(t)
|
|
defer cleanupTmpIndexPath(t, tmpIndexPath)
|
|
|
|
idx, err := New(tmpIndexPath, NewIndexMapping())
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
doca := map[string]interface{}{
|
|
"name": "scorch",
|
|
"desc": "gophercon india",
|
|
"nation": "india",
|
|
}
|
|
|
|
batchA := idx.NewBatch()
|
|
err = batchA.Index("a", doca)
|
|
if err != nil {
|
|
t.Error(err)
|
|
}
|
|
batchA.SetInternal([]byte("batchkA"), []byte("batchvA"))
|
|
|
|
docb := map[string]interface{}{
|
|
"name": "moss",
|
|
"desc": "gophercon MV",
|
|
}
|
|
|
|
batchB := idx.NewBatch()
|
|
err = batchB.Index("b", docb)
|
|
if err != nil {
|
|
t.Error(err)
|
|
}
|
|
batchB.SetInternal([]byte("batchkB"), []byte("batchvB"))
|
|
|
|
docC := map[string]interface{}{
|
|
"name": "blahblah",
|
|
"desc": "inProgress",
|
|
"country": "usa",
|
|
}
|
|
|
|
batchC := idx.NewBatch()
|
|
err = batchC.Index("c", docC)
|
|
if err != nil {
|
|
t.Error(err)
|
|
}
|
|
batchC.SetInternal([]byte("batchkC"), []byte("batchvC"))
|
|
batchC.SetInternal([]byte("batchkB"), []byte("batchvBNew"))
|
|
batchC.Delete("a")
|
|
batchC.DeleteInternal([]byte("batchkA"))
|
|
|
|
batchA.Merge(batchB)
|
|
|
|
if batchA.Size() != 4 {
|
|
t.Errorf("expected batch size 4, got %d", batchA.Size())
|
|
}
|
|
|
|
batchA.Merge(batchC)
|
|
|
|
if batchA.Size() != 6 {
|
|
t.Errorf("expected batch size 6, got %d", batchA.Size())
|
|
}
|
|
|
|
err = idx.Batch(batchA)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
// close the index, open it again, and try some more things
|
|
err = idx.Close()
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
idx, err = Open(tmpIndexPath)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
defer func() {
|
|
err := idx.Close()
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
}()
|
|
|
|
count, err := idx.DocCount()
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
if count != 2 {
|
|
t.Errorf("expected doc count 2, got %d", count)
|
|
}
|
|
|
|
doc, err := idx.Document("c")
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
val, err := idx.GetInternal([]byte("batchkB"))
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
if val == nil || string(val) != "batchvBNew" {
|
|
t.Errorf("expected val: batchvBNew , got %s", val)
|
|
}
|
|
|
|
val, err = idx.GetInternal([]byte("batchkA"))
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
if val != nil {
|
|
t.Errorf("expected nil, got %s", val)
|
|
}
|
|
|
|
foundNameField := false
|
|
doc.VisitFields(func(field index.Field) {
|
|
if field.Name() == "name" && string(field.Value()) == "blahblah" {
|
|
foundNameField = true
|
|
}
|
|
})
|
|
if !foundNameField {
|
|
t.Errorf("expected to find field named 'name' with value 'blahblah'")
|
|
}
|
|
|
|
fields, err := idx.Fields()
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
expectedFields := map[string]bool{
|
|
"_all": false,
|
|
"name": false,
|
|
"desc": false,
|
|
"country": false,
|
|
}
|
|
if len(fields) < len(expectedFields) {
|
|
t.Fatalf("expected %d fields got %d", len(expectedFields), len(fields))
|
|
}
|
|
|
|
for _, f := range fields {
|
|
expectedFields[f] = true
|
|
}
|
|
|
|
for ef, efp := range expectedFields {
|
|
if !efp {
|
|
t.Errorf("field %s is missing", ef)
|
|
}
|
|
}
|
|
}
|
|
|
|
func TestBug1096(t *testing.T) {
|
|
tmpIndexPath := createTmpIndexPath(t)
|
|
defer cleanupTmpIndexPath(t, tmpIndexPath)
|
|
|
|
// use default mapping
|
|
mapping := NewIndexMapping()
|
|
|
|
// create a scorch index with default SAFE batches
|
|
var idx Index
|
|
idx, err = NewUsing(tmpIndexPath, mapping, "scorch", "scorch", nil)
|
|
if err != nil {
|
|
log.Fatal(err)
|
|
}
|
|
defer func() {
|
|
err := idx.Close()
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
}()
|
|
|
|
// create a single batch instance that we will reuse
|
|
// this should be safe because we have single goroutine
|
|
// and we always wait for batch execution to finish
|
|
batch := idx.NewBatch()
|
|
|
|
// number of batches to execute
|
|
for i := 0; i < 10; i++ {
|
|
|
|
// number of documents to put into the batch
|
|
for j := 0; j < 91; j++ {
|
|
|
|
// create a doc id 0-90 (important so that we get id's 9 and 90)
|
|
// this could duplicate something already in the index
|
|
// this too should be OK and update the item in the index
|
|
id := fmt.Sprintf("%d", j)
|
|
|
|
err = batch.Index(id, map[string]interface{}{
|
|
"name": id,
|
|
"batch": fmt.Sprintf("%d", i),
|
|
})
|
|
if err != nil {
|
|
log.Fatal(err)
|
|
}
|
|
}
|
|
|
|
// execute the batch
|
|
err = idx.Batch(batch)
|
|
if err != nil {
|
|
log.Fatal(err)
|
|
}
|
|
|
|
// reset the batch before reusing it
|
|
batch.Reset()
|
|
}
|
|
|
|
// search for docs having name starting with the number 9
|
|
q := NewWildcardQuery("9*")
|
|
q.SetField("name")
|
|
req := NewSearchRequestOptions(q, 1000, 0, false)
|
|
req.Fields = []string{"*"}
|
|
var res *SearchResult
|
|
res, err = idx.Search(req)
|
|
if err != nil {
|
|
log.Fatal(err)
|
|
}
|
|
|
|
// we expect only 2 hits, for docs 9 and 90
|
|
if res.Total > 2 {
|
|
t.Fatalf("expected only 2 hits '9' and '90', got %v", res)
|
|
}
|
|
}
|
|
|
|
func TestDataRaceBug1092(t *testing.T) {
|
|
tmpIndexPath := createTmpIndexPath(t)
|
|
defer cleanupTmpIndexPath(t, tmpIndexPath)
|
|
|
|
// use default mapping
|
|
mapping := NewIndexMapping()
|
|
|
|
var idx Index
|
|
idx, err = NewUsing(tmpIndexPath, mapping, upsidedown.Name, boltdb.Name, nil)
|
|
if err != nil {
|
|
log.Fatal(err)
|
|
}
|
|
defer func() {
|
|
cerr := idx.Close()
|
|
if cerr != nil {
|
|
t.Fatal(cerr)
|
|
}
|
|
}()
|
|
|
|
batch := idx.NewBatch()
|
|
for i := 0; i < 10; i++ {
|
|
err = idx.Batch(batch)
|
|
if err != nil {
|
|
t.Error(err)
|
|
}
|
|
|
|
batch.Reset()
|
|
}
|
|
}
|
|
|
|
func TestBatchRaceBug1149(t *testing.T) {
|
|
tmpIndexPath := createTmpIndexPath(t)
|
|
defer cleanupTmpIndexPath(t, tmpIndexPath)
|
|
i, err := New(tmpIndexPath, NewIndexMapping())
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
defer func() {
|
|
err := i.Close()
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
}()
|
|
testBatchRaceBug1149(t, i)
|
|
}
|
|
|
|
func TestBatchRaceBug1149Scorch(t *testing.T) {
|
|
tmpIndexPath := createTmpIndexPath(t)
|
|
defer cleanupTmpIndexPath(t, tmpIndexPath)
|
|
i, err := NewUsing(tmpIndexPath, NewIndexMapping(), "scorch", "scorch", nil)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
defer func() {
|
|
err := i.Close()
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
}()
|
|
testBatchRaceBug1149(t, i)
|
|
}
|
|
|
|
func testBatchRaceBug1149(t *testing.T, i Index) {
|
|
b := i.NewBatch()
|
|
b.Delete("1")
|
|
err = i.Batch(b)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
b.Reset()
|
|
err = i.Batch(b)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
b.Reset()
|
|
}
|
|
|
|
func TestOptimisedConjunctionSearchHits(t *testing.T) {
|
|
scorch.OptimizeDisjunctionUnadorned = false
|
|
defer func() {
|
|
scorch.OptimizeDisjunctionUnadorned = true
|
|
}()
|
|
|
|
defer func() {
|
|
err := os.RemoveAll("testidx")
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
}()
|
|
|
|
idx, err := NewUsing("testidx", NewIndexMapping(), "scorch", "scorch", nil)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
doca := map[string]interface{}{
|
|
"country": "united",
|
|
"name": "Mercure Hotel",
|
|
"directions": "B560 and B56 Follow signs to the M56",
|
|
}
|
|
docb := map[string]interface{}{
|
|
"country": "united",
|
|
"name": "Mercure Altrincham Bowdon Hotel",
|
|
"directions": "A570 and A57 Follow signs to the M56 Manchester Airport",
|
|
}
|
|
docc := map[string]interface{}{
|
|
"country": "india united",
|
|
"name": "Sonoma Hotel",
|
|
"directions": "Northwest",
|
|
}
|
|
docd := map[string]interface{}{
|
|
"country": "United Kingdom",
|
|
"name": "Cresta Court Hotel",
|
|
"directions": "junction of A560 and A56",
|
|
}
|
|
|
|
b := idx.NewBatch()
|
|
err = b.Index("a", doca)
|
|
if err != nil {
|
|
t.Error(err)
|
|
}
|
|
err = b.Index("b", docb)
|
|
if err != nil {
|
|
t.Error(err)
|
|
}
|
|
err = b.Index("c", docc)
|
|
if err != nil {
|
|
t.Error(err)
|
|
}
|
|
err = b.Index("d", docd)
|
|
if err != nil {
|
|
t.Error(err)
|
|
}
|
|
// execute the batch
|
|
err = idx.Batch(b)
|
|
if err != nil {
|
|
log.Fatal(err)
|
|
}
|
|
|
|
mq := NewMatchQuery("united")
|
|
mq.SetField("country")
|
|
|
|
cq := NewConjunctionQuery(mq)
|
|
|
|
mq1 := NewMatchQuery("hotel")
|
|
mq1.SetField("name")
|
|
cq.AddQuery(mq1)
|
|
|
|
mq2 := NewMatchQuery("56")
|
|
mq2.SetField("directions")
|
|
mq2.SetFuzziness(1)
|
|
cq.AddQuery(mq2)
|
|
|
|
req := NewSearchRequest(cq)
|
|
req.Score = "none"
|
|
|
|
res, err := idx.Search(req)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
hitsWithOutScore := res.Total
|
|
|
|
req = NewSearchRequest(cq)
|
|
req.Score = ""
|
|
|
|
res, err = idx.Search(req)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
hitsWithScore := res.Total
|
|
|
|
if hitsWithOutScore != hitsWithScore {
|
|
t.Errorf("expected %d hits without score, got %d", hitsWithScore, hitsWithOutScore)
|
|
}
|
|
|
|
err = idx.Close()
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
}
|
|
|
|
func TestIndexMappingDocValuesDynamic(t *testing.T) {
|
|
im := NewIndexMapping()
|
|
// DocValuesDynamic's default is true
|
|
// Now explicitly set it to false
|
|
im.DocValuesDynamic = false
|
|
|
|
// Next, retrieve the JSON dump of the index mapping
|
|
var data []byte
|
|
data, err = json.Marshal(im)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
// Now, edit an unrelated setting in the index mapping
|
|
var m map[string]interface{}
|
|
err = json.Unmarshal(data, &m)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
m["index_dynamic"] = false
|
|
data, err = json.Marshal(m)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
// Unmarshal back the changes into the index mapping struct
|
|
if err = im.UnmarshalJSON(data); err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
// Expect DocValuesDynamic to remain false!
|
|
if im.DocValuesDynamic {
|
|
t.Fatalf("Expected DocValuesDynamic to remain false after the index mapping edit")
|
|
}
|
|
}
|
|
|
|
func TestCopyIndex(t *testing.T) {
|
|
tmpIndexPath := createTmpIndexPath(t)
|
|
defer cleanupTmpIndexPath(t, tmpIndexPath)
|
|
|
|
idx, err := New(tmpIndexPath, NewIndexMapping())
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
defer func() {
|
|
err := idx.Close()
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
}()
|
|
|
|
doca := map[string]interface{}{
|
|
"name": "tester",
|
|
"desc": "gophercon india testing",
|
|
}
|
|
err = idx.Index("a", doca)
|
|
if err != nil {
|
|
t.Error(err)
|
|
}
|
|
|
|
docy := map[string]interface{}{
|
|
"name": "jasper",
|
|
"desc": "clojure",
|
|
}
|
|
err = idx.Index("y", docy)
|
|
if err != nil {
|
|
t.Error(err)
|
|
}
|
|
|
|
err = idx.Delete("y")
|
|
if err != nil {
|
|
t.Error(err)
|
|
}
|
|
|
|
docx := map[string]interface{}{
|
|
"name": "rose",
|
|
"desc": "xoogler",
|
|
}
|
|
err = idx.Index("x", docx)
|
|
if err != nil {
|
|
t.Error(err)
|
|
}
|
|
|
|
err = idx.SetInternal([]byte("status"), []byte("pending"))
|
|
if err != nil {
|
|
t.Error(err)
|
|
}
|
|
|
|
docb := map[string]interface{}{
|
|
"name": "sree",
|
|
"desc": "cbft janitor",
|
|
}
|
|
batch := idx.NewBatch()
|
|
err = batch.Index("b", docb)
|
|
if err != nil {
|
|
t.Error(err)
|
|
}
|
|
batch.Delete("x")
|
|
batch.SetInternal([]byte("batchi"), []byte("batchv"))
|
|
batch.DeleteInternal([]byte("status"))
|
|
err = idx.Batch(batch)
|
|
if err != nil {
|
|
t.Error(err)
|
|
}
|
|
val, err := idx.GetInternal([]byte("batchi"))
|
|
if err != nil {
|
|
t.Error(err)
|
|
}
|
|
if string(val) != "batchv" {
|
|
t.Errorf("expected 'batchv', got '%s'", val)
|
|
}
|
|
val, err = idx.GetInternal([]byte("status"))
|
|
if err != nil {
|
|
t.Error(err)
|
|
}
|
|
if val != nil {
|
|
t.Errorf("expected nil, got '%s'", val)
|
|
}
|
|
|
|
err = idx.SetInternal([]byte("seqno"), []byte("7"))
|
|
if err != nil {
|
|
t.Error(err)
|
|
}
|
|
err = idx.SetInternal([]byte("status"), []byte("ready"))
|
|
if err != nil {
|
|
t.Error(err)
|
|
}
|
|
err = idx.DeleteInternal([]byte("status"))
|
|
if err != nil {
|
|
t.Error(err)
|
|
}
|
|
val, err = idx.GetInternal([]byte("status"))
|
|
if err != nil {
|
|
t.Error(err)
|
|
}
|
|
if val != nil {
|
|
t.Errorf("expected nil, got '%s'", val)
|
|
}
|
|
|
|
val, err = idx.GetInternal([]byte("seqno"))
|
|
if err != nil {
|
|
t.Error(err)
|
|
}
|
|
if string(val) != "7" {
|
|
t.Errorf("expected '7', got '%s'", val)
|
|
}
|
|
|
|
count, err := idx.DocCount()
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
if count != 2 {
|
|
t.Errorf("expected doc count 2, got %d", count)
|
|
}
|
|
|
|
doc, err := idx.Document("a")
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
foundNameField := false
|
|
doc.VisitFields(func(field index.Field) {
|
|
if field.Name() == "name" && string(field.Value()) == "tester" {
|
|
foundNameField = true
|
|
}
|
|
})
|
|
if !foundNameField {
|
|
t.Errorf("expected to find field named 'name' with value 'tester'")
|
|
}
|
|
|
|
fields, err := idx.Fields()
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
expectedFields := map[string]bool{
|
|
"_all": false,
|
|
"name": false,
|
|
"desc": false,
|
|
}
|
|
if len(fields) < len(expectedFields) {
|
|
t.Fatalf("expected %d fields got %d", len(expectedFields), len(fields))
|
|
}
|
|
for _, f := range fields {
|
|
expectedFields[f] = true
|
|
}
|
|
for ef, efp := range expectedFields {
|
|
if !efp {
|
|
t.Errorf("field %s is missing", ef)
|
|
}
|
|
}
|
|
|
|
// now create a copy of the index, and repeat assertions on it
|
|
copyableIndex, ok := idx.(IndexCopyable)
|
|
if !ok {
|
|
t.Fatal("index doesn't support copy")
|
|
}
|
|
backupIndexPath := createTmpIndexPath(t)
|
|
defer cleanupTmpIndexPath(t, backupIndexPath)
|
|
|
|
err = copyableIndex.CopyTo(FileSystemDirectory(backupIndexPath))
|
|
if err != nil {
|
|
t.Fatalf("error copying the index: %v", err)
|
|
}
|
|
|
|
// open the copied index
|
|
idxCopied, err := Open(backupIndexPath)
|
|
if err != nil {
|
|
t.Fatalf("unable to open copy index")
|
|
}
|
|
defer func() {
|
|
err := idxCopied.Close()
|
|
if err != nil {
|
|
t.Fatalf("error closing copy index: %v", err)
|
|
}
|
|
}()
|
|
|
|
// assertions on copied index
|
|
copyCount, err := idxCopied.DocCount()
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
if copyCount != 2 {
|
|
t.Errorf("expected doc count 2, got %d", copyCount)
|
|
}
|
|
|
|
copyDoc, err := idxCopied.Document("a")
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
copyFoundNameField := false
|
|
copyDoc.VisitFields(func(field index.Field) {
|
|
if field.Name() == "name" && string(field.Value()) == "tester" {
|
|
copyFoundNameField = true
|
|
}
|
|
})
|
|
if !copyFoundNameField {
|
|
t.Errorf("expected copy index to find field named 'name' with value 'tester'")
|
|
}
|
|
|
|
copyFields, err := idx.Fields()
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
copyExpectedFields := map[string]bool{
|
|
"_all": false,
|
|
"name": false,
|
|
"desc": false,
|
|
}
|
|
if len(copyFields) < len(copyExpectedFields) {
|
|
t.Fatalf("expected %d fields got %d", len(copyExpectedFields), len(copyFields))
|
|
}
|
|
for _, f := range copyFields {
|
|
copyExpectedFields[f] = true
|
|
}
|
|
for ef, efp := range copyExpectedFields {
|
|
if !efp {
|
|
t.Errorf("copy field %s is missing", ef)
|
|
}
|
|
}
|
|
}
|
|
|
|
func TestFuzzyScoring(t *testing.T) {
|
|
tmpIndexPath := createTmpIndexPath(t)
|
|
defer cleanupTmpIndexPath(t, tmpIndexPath)
|
|
|
|
mp := NewIndexMapping()
|
|
mp.DefaultAnalyzer = "simple"
|
|
idx, err := New(tmpIndexPath, mp)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
batch := idx.NewBatch()
|
|
|
|
docs := []map[string]interface{}{
|
|
{
|
|
"textField": "ab",
|
|
},
|
|
{
|
|
"textField": "abc",
|
|
},
|
|
{
|
|
"textField": "abcd",
|
|
},
|
|
}
|
|
|
|
for _, doc := range docs {
|
|
err := batch.Index(fmt.Sprintf("%v", doc["textField"]), doc)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
}
|
|
|
|
err = idx.Batch(batch)
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
|
|
query := NewFuzzyQuery("ab")
|
|
query.Fuzziness = 2
|
|
searchRequest := NewSearchRequestOptions(query, 10, 0, true)
|
|
res, err := idx.Search(searchRequest)
|
|
if err != nil {
|
|
t.Error(err)
|
|
}
|
|
|
|
maxScore := res.Hits[0].Score
|
|
|
|
for i, hit := range res.Hits {
|
|
if maxScore/float64(i+1) != hit.Score {
|
|
t.Errorf("expected score - %f, got score - %f", maxScore/float64(i+1), hit.Score)
|
|
}
|
|
}
|
|
|
|
err = idx.Close()
|
|
if err != nil {
|
|
t.Fatal(err)
|
|
}
|
|
}
|