// Copyright (c) 2014 Couchbase, Inc. // // Licensed under the Apache License, Version 2.0 (the "License"); // you may not use this file except in compliance with the License. // You may obtain a copy of the License at // // http://www.apache.org/licenses/LICENSE-2.0 // // Unless required by applicable law or agreed to in writing, software // distributed under the License is distributed on an "AS IS" BASIS, // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. // See the License for the specific language governing permissions and // limitations under the License. package bleve import ( "context" "encoding/json" "fmt" "io" "log" "math" "os" "path/filepath" "reflect" "sort" "strconv" "strings" "sync" "testing" "time" "github.com/blevesearch/bleve/v2/analysis/analyzer/keyword" "github.com/blevesearch/bleve/v2/document" "github.com/blevesearch/bleve/v2/index/upsidedown/store/boltdb" "github.com/blevesearch/bleve/v2/index/upsidedown/store/null" "github.com/blevesearch/bleve/v2/mapping" "github.com/blevesearch/bleve/v2/search" "github.com/blevesearch/bleve/v2/search/query" index "github.com/blevesearch/bleve_index_api" "github.com/blevesearch/bleve/v2/index/scorch" "github.com/blevesearch/bleve/v2/index/upsidedown" ) type Fatalfable interface { Fatalf(format string, args ...interface{}) } func createTmpIndexPath(f Fatalfable) string { tmpIndexPath, err := os.MkdirTemp("", "bleve-testidx") if err != nil { f.Fatalf("error creating temp dir: %v", err) } return tmpIndexPath } func cleanupTmpIndexPath(f Fatalfable, path string) { err := os.RemoveAll(path) if err != nil { f.Fatalf("error removing temp dir: %v", err) } } func TestCrud(t *testing.T) { tmpIndexPath := createTmpIndexPath(t) defer cleanupTmpIndexPath(t, tmpIndexPath) idx, err := New(tmpIndexPath, NewIndexMapping()) if err != nil { t.Fatal(err) } doca := map[string]interface{}{ "name": "marty", "desc": "gophercon india", } err = idx.Index("a", doca) if err != nil { t.Error(err) } docy := map[string]interface{}{ "name": "jasper", "desc": "clojure", } err = idx.Index("y", docy) if err != nil { t.Error(err) } err = idx.Delete("y") if err != nil { t.Error(err) } docx := map[string]interface{}{ "name": "rose", "desc": "googler", } err = idx.Index("x", docx) if err != nil { t.Error(err) } err = idx.SetInternal([]byte("status"), []byte("pending")) if err != nil { t.Error(err) } docb := map[string]interface{}{ "name": "steve", "desc": "cbft master", } batch := idx.NewBatch() err = batch.Index("b", docb) if err != nil { t.Error(err) } batch.Delete("x") batch.SetInternal([]byte("batchi"), []byte("batchv")) batch.DeleteInternal([]byte("status")) err = idx.Batch(batch) if err != nil { t.Error(err) } val, err := idx.GetInternal([]byte("batchi")) if err != nil { t.Error(err) } if string(val) != "batchv" { t.Errorf("expected 'batchv', got '%s'", val) } val, err = idx.GetInternal([]byte("status")) if err != nil { t.Error(err) } if val != nil { t.Errorf("expected nil, got '%s'", val) } err = idx.SetInternal([]byte("seqno"), []byte("7")) if err != nil { t.Error(err) } err = idx.SetInternal([]byte("status"), []byte("ready")) if err != nil { t.Error(err) } err = idx.DeleteInternal([]byte("status")) if err != nil { t.Error(err) } val, err = idx.GetInternal([]byte("status")) if err != nil { t.Error(err) } if val != nil { t.Errorf("expected nil, got '%s'", val) } val, err = idx.GetInternal([]byte("seqno")) if err != nil { t.Error(err) } if string(val) != "7" { t.Errorf("expected '7', got '%s'", val) } // close the index, open it again, and try some more things err = idx.Close() if err != nil { t.Fatal(err) } idx, err = Open(tmpIndexPath) if err != nil { t.Fatal(err) } defer func() { err := idx.Close() if err != nil { t.Fatal(err) } }() count, err := idx.DocCount() if err != nil { t.Fatal(err) } if count != 2 { t.Errorf("expected doc count 2, got %d", count) } doc, err := idx.Document("a") if err != nil { t.Fatal(err) } foundNameField := false doc.VisitFields(func(field index.Field) { if field.Name() == "name" && string(field.Value()) == "marty" { foundNameField = true } }) if !foundNameField { t.Errorf("expected to find field named 'name' with value 'marty'") } fields, err := idx.Fields() if err != nil { t.Fatal(err) } expectedFields := map[string]bool{ "_all": false, "name": false, "desc": false, } if len(fields) < len(expectedFields) { t.Fatalf("expected %d fields got %d", len(expectedFields), len(fields)) } for _, f := range fields { expectedFields[f] = true } for ef, efp := range expectedFields { if !efp { t.Errorf("field %s is missing", ef) } } } func approxSame(actual, expected uint64) bool { modulus := func(a, b uint64) uint64 { if a > b { return a - b } return b - a } return float64(modulus(actual, expected))/float64(expected) < float64(0.30) } func checkStatsOnIndexedBatch(indexPath string, indexMapping mapping.IndexMapping, expectedVal uint64, ) error { var wg sync.WaitGroup var statValError error idx, err := NewUsing(indexPath, indexMapping, Config.DefaultIndexType, Config.DefaultMemKVStore, nil) if err != nil { return err } batch, err := getBatchFromData(idx, "sample-data.json") if err != nil { return fmt.Errorf("failed to form a batch %v\n", err) } wg.Add(1) batch.SetPersistedCallback(func(e error) { defer wg.Done() stats, _ := idx.StatsMap()["index"].(map[string]interface{}) bytesWritten, _ := stats["num_bytes_written_at_index_time"].(uint64) if !approxSame(bytesWritten, expectedVal) { statValError = fmt.Errorf("expected bytes written is %d, got %v", expectedVal, bytesWritten) } }) err = idx.Batch(batch) if err != nil { return fmt.Errorf("failed to index batch %v\n", err) } wg.Wait() idx.Close() return statValError } func TestBytesWritten(t *testing.T) { tmpIndexPath := createTmpIndexPath(t) indexMapping := NewIndexMapping() indexMapping.TypeField = "type" indexMapping.DefaultAnalyzer = "en" documentMapping := NewDocumentMapping() indexMapping.AddDocumentMapping("hotel", documentMapping) indexMapping.DocValuesDynamic = false indexMapping.StoreDynamic = false contentFieldMapping := NewTextFieldMapping() contentFieldMapping.Index = true contentFieldMapping.Store = false contentFieldMapping.IncludeInAll = false contentFieldMapping.IncludeTermVectors = false contentFieldMapping.DocValues = false reviewsMapping := NewDocumentMapping() reviewsMapping.AddFieldMappingsAt("content", contentFieldMapping) documentMapping.AddSubDocumentMapping("reviews", reviewsMapping) typeFieldMapping := NewTextFieldMapping() typeFieldMapping.Store = false typeFieldMapping.IncludeInAll = false typeFieldMapping.IncludeTermVectors = false typeFieldMapping.DocValues = false documentMapping.AddFieldMappingsAt("type", typeFieldMapping) err = checkStatsOnIndexedBatch(tmpIndexPath, indexMapping, 57273) if err != nil { t.Fatal(err) } cleanupTmpIndexPath(t, tmpIndexPath) contentFieldMapping.Store = true tmpIndexPath1 := createTmpIndexPath(t) err := checkStatsOnIndexedBatch(tmpIndexPath1, indexMapping, 76069) if err != nil { t.Fatal(err) } cleanupTmpIndexPath(t, tmpIndexPath1) contentFieldMapping.Store = false contentFieldMapping.IncludeInAll = true tmpIndexPath2 := createTmpIndexPath(t) err = checkStatsOnIndexedBatch(tmpIndexPath2, indexMapping, 68875) if err != nil { t.Fatal(err) } cleanupTmpIndexPath(t, tmpIndexPath2) contentFieldMapping.IncludeInAll = false contentFieldMapping.IncludeTermVectors = true tmpIndexPath3 := createTmpIndexPath(t) err = checkStatsOnIndexedBatch(tmpIndexPath3, indexMapping, 78985) if err != nil { t.Fatal(err) } cleanupTmpIndexPath(t, tmpIndexPath3) contentFieldMapping.IncludeTermVectors = false contentFieldMapping.DocValues = true tmpIndexPath4 := createTmpIndexPath(t) err = checkStatsOnIndexedBatch(tmpIndexPath4, indexMapping, 64228) if err != nil { t.Fatal(err) } cleanupTmpIndexPath(t, tmpIndexPath4) } func createIndexMappingOnSampleData() *mapping.IndexMappingImpl { indexMapping := NewIndexMapping() indexMapping.TypeField = "type" indexMapping.DefaultAnalyzer = "en" indexMapping.ScoringModel = index.DefaultScoringModel documentMapping := NewDocumentMapping() indexMapping.AddDocumentMapping("hotel", documentMapping) indexMapping.StoreDynamic = false indexMapping.DocValuesDynamic = false contentFieldMapping := NewTextFieldMapping() contentFieldMapping.Store = false reviewsMapping := NewDocumentMapping() reviewsMapping.AddFieldMappingsAt("content", contentFieldMapping) documentMapping.AddSubDocumentMapping("reviews", reviewsMapping) typeFieldMapping := NewTextFieldMapping() typeFieldMapping.Store = false documentMapping.AddFieldMappingsAt("type", typeFieldMapping) return indexMapping } func TestBM25TFIDFScoring(t *testing.T) { tmpIndexPath1 := createTmpIndexPath(t) defer cleanupTmpIndexPath(t, tmpIndexPath1) tmpIndexPath2 := createTmpIndexPath(t) defer cleanupTmpIndexPath(t, tmpIndexPath2) indexMapping := createIndexMappingOnSampleData() indexMapping.ScoringModel = index.BM25Scoring indexBM25, err := NewUsing(tmpIndexPath1, indexMapping, Config.DefaultIndexType, Config.DefaultMemKVStore, nil) if err != nil { t.Fatal(err) } indexMapping1 := createIndexMappingOnSampleData() indexTFIDF, err := NewUsing(tmpIndexPath2, indexMapping1, Config.DefaultIndexType, Config.DefaultMemKVStore, nil) if err != nil { t.Fatal(err) } defer func() { err := indexBM25.Close() if err != nil { t.Fatal(err) } err = indexTFIDF.Close() if err != nil { t.Fatal(err) } }() batch, err := getBatchFromData(indexBM25, "sample-data.json") if err != nil { t.Fatalf("failed to form a batch") } err = indexBM25.Batch(batch) if err != nil { t.Fatalf("failed to index batch %v\n", err) } query := NewMatchQuery("Hotel") query.FieldVal = "name" searchRequest := NewSearchRequestOptions(query, int(10), 0, true) resBM25, err := indexBM25.Search(searchRequest) if err != nil { t.Error(err) } batch, err = getBatchFromData(indexTFIDF, "sample-data.json") if err != nil { t.Fatalf("failed to form a batch") } err = indexTFIDF.Batch(batch) if err != nil { t.Fatalf("failed to index batch %v\n", err) } resTFIDF, err := indexTFIDF.Search(searchRequest) if err != nil { t.Error(err) } for i, hit := range resTFIDF.Hits { if hit.Score < resBM25.Hits[i].Score { t.Fatalf("expected the score to be higher for BM25, got %v and %v", resBM25.Hits[i].Score, hit.Score) } } } func TestBM25GlobalScoring(t *testing.T) { tmpIndexPath := createTmpIndexPath(t) defer cleanupTmpIndexPath(t, tmpIndexPath) indexMapping := createIndexMappingOnSampleData() indexMapping.ScoringModel = index.BM25Scoring idxSinglePartition, err := NewUsing(tmpIndexPath, indexMapping, Config.DefaultIndexType, Config.DefaultMemKVStore, nil) if err != nil { t.Fatal(err) } defer func() { err := idxSinglePartition.Close() if err != nil { t.Fatal(err) } }() batch, err := getBatchFromData(idxSinglePartition, "sample-data.json") if err != nil { t.Fatalf("failed to form a batch") } err = idxSinglePartition.Batch(batch) if err != nil { t.Fatalf("failed to index batch %v\n", err) } query := NewMatchQuery("Hotel") query.FieldVal = "name" searchRequest := NewSearchRequestOptions(query, int(10), 0, true) res, err := idxSinglePartition.Search(searchRequest) if err != nil { t.Error(err) } singlePartHits := res.Hits dataset, _ := readDataFromFile("sample-data.json") tmpIndexPath1 := createTmpIndexPath(t) defer cleanupTmpIndexPath(t, tmpIndexPath1) idxPart1, err := NewUsing(tmpIndexPath1, indexMapping, Config.DefaultIndexType, Config.DefaultMemKVStore, nil) if err != nil { t.Fatal(err) } defer func() { err := idxPart1.Close() if err != nil { t.Fatal(err) } }() batch1 := idxPart1.NewBatch() for _, doc := range dataset[:len(dataset)/2] { err = batch1.Index(fmt.Sprintf("%d", doc["id"]), doc) if err != nil { t.Fatal(err) } } err = idxPart1.Batch(batch1) if err != nil { t.Fatal(err) } tmpIndexPath2 := createTmpIndexPath(t) defer cleanupTmpIndexPath(t, tmpIndexPath2) idxPart2, err := NewUsing(tmpIndexPath2, indexMapping, Config.DefaultIndexType, Config.DefaultMemKVStore, nil) if err != nil { t.Fatal(err) } defer func() { err := idxPart2.Close() if err != nil { t.Fatal(err) } }() batch2 := idxPart2.NewBatch() for _, doc := range dataset[len(dataset)/2:] { err = batch2.Index(fmt.Sprintf("%d", doc["id"]), doc) if err != nil { t.Fatal(err) } } err = idxPart2.Batch(batch2) if err != nil { t.Fatal(err) } multiPartIndex := NewIndexAlias(idxPart1, idxPart2) err = multiPartIndex.SetIndexMapping(indexMapping) if err != nil { t.Fatal(err) } ctx := context.Background() // this key is set to ensure that we have a consistent scoring at the index alias // level (it forces a pre search phase which can have a small overhead) ctx = context.WithValue(ctx, search.SearchTypeKey, search.GlobalScoring) res, err = multiPartIndex.SearchInContext(ctx, searchRequest) if err != nil { t.Error(err) } for i, hit := range res.Hits { if hit.Score != singlePartHits[i].Score { t.Fatalf("expected the scores to be the same, got %v and %v", hit.Score, singlePartHits[i].Score) } } } func TestBytesRead(t *testing.T) { tmpIndexPath := createTmpIndexPath(t) defer cleanupTmpIndexPath(t, tmpIndexPath) indexMapping := NewIndexMapping() indexMapping.TypeField = "type" indexMapping.DefaultAnalyzer = "en" documentMapping := NewDocumentMapping() indexMapping.AddDocumentMapping("hotel", documentMapping) indexMapping.StoreDynamic = false indexMapping.DocValuesDynamic = false contentFieldMapping := NewTextFieldMapping() contentFieldMapping.Store = false reviewsMapping := NewDocumentMapping() reviewsMapping.AddFieldMappingsAt("content", contentFieldMapping) documentMapping.AddSubDocumentMapping("reviews", reviewsMapping) typeFieldMapping := NewTextFieldMapping() typeFieldMapping.Store = false documentMapping.AddFieldMappingsAt("type", typeFieldMapping) idx, err := NewUsing(tmpIndexPath, indexMapping, Config.DefaultIndexType, Config.DefaultMemKVStore, nil) if err != nil { t.Fatal(err) } defer func() { err := idx.Close() if err != nil { t.Fatal(err) } }() batch, err := getBatchFromData(idx, "sample-data.json") if err != nil { t.Fatalf("failed to form a batch") } err = idx.Batch(batch) if err != nil { t.Fatalf("failed to index batch %v\n", err) } query := NewQueryStringQuery("united") searchRequest := NewSearchRequestOptions(query, int(10), 0, true) res, err := idx.Search(searchRequest) if err != nil { t.Error(err) } stats, _ := idx.StatsMap()["index"].(map[string]interface{}) prevBytesRead, _ := stats["num_bytes_read_at_query_time"].(uint64) expectedBytesRead := uint64(22049) if supportForVectorSearch { expectedBytesRead = 22459 } if prevBytesRead != expectedBytesRead && res.Cost == prevBytesRead { t.Fatalf("expected bytes read for query string %v, got %v", expectedBytesRead, prevBytesRead) } // subsequent queries on the same field results in lesser amount // of bytes read because the segment static and dictionary is reused and not // loaded from mmap'd filed res, err = idx.Search(searchRequest) if err != nil { t.Error(err) } stats, _ = idx.StatsMap()["index"].(map[string]interface{}) bytesRead, _ := stats["num_bytes_read_at_query_time"].(uint64) if bytesRead-prevBytesRead != 66 && res.Cost == bytesRead-prevBytesRead { t.Fatalf("expected bytes read for query string 66, got %v", bytesRead-prevBytesRead) } prevBytesRead = bytesRead fuzz := NewFuzzyQuery("hotel") fuzz.FieldVal = "reviews.content" fuzz.Fuzziness = 2 searchRequest = NewSearchRequest(fuzz) res, err = idx.Search(searchRequest) if err != nil { t.Error(err) } stats, _ = idx.StatsMap()["index"].(map[string]interface{}) bytesRead, _ = stats["num_bytes_read_at_query_time"].(uint64) if bytesRead-prevBytesRead != 8468 && res.Cost == bytesRead-prevBytesRead { t.Fatalf("expected bytes read for fuzzy query is 8468, got %v", bytesRead-prevBytesRead) } prevBytesRead = bytesRead typeFacet := NewFacetRequest("type", 2) query = NewQueryStringQuery("united") searchRequest = NewSearchRequestOptions(query, int(0), 0, true) searchRequest.AddFacet("types", typeFacet) res, err = idx.Search(searchRequest) if err != nil { t.Error(err) } stats, _ = idx.StatsMap()["index"].(map[string]interface{}) bytesRead, _ = stats["num_bytes_read_at_query_time"].(uint64) if !approxSame(bytesRead-prevBytesRead, 196) && res.Cost == bytesRead-prevBytesRead { t.Fatalf("expected bytes read for faceted query is around 196, got %v", bytesRead-prevBytesRead) } prevBytesRead = bytesRead min := float64(8660) max := float64(8665) numRangeQuery := NewNumericRangeQuery(&min, &max) numRangeQuery.FieldVal = "id" searchRequest = NewSearchRequestOptions(numRangeQuery, int(10), 0, true) res, err = idx.Search(searchRequest) if err != nil { t.Error(err) } stats, _ = idx.StatsMap()["index"].(map[string]interface{}) bytesRead, _ = stats["num_bytes_read_at_query_time"].(uint64) if bytesRead-prevBytesRead != 924 && res.Cost == bytesRead-prevBytesRead { t.Fatalf("expected bytes read for numeric range query is 924, got %v", bytesRead-prevBytesRead) } prevBytesRead = bytesRead searchRequest = NewSearchRequestOptions(query, int(10), 0, true) searchRequest.Highlight = &HighlightRequest{} res, err = idx.Search(searchRequest) if err != nil { t.Error(err) } stats, _ = idx.StatsMap()["index"].(map[string]interface{}) bytesRead, _ = stats["num_bytes_read_at_query_time"].(uint64) if bytesRead-prevBytesRead != 105 && res.Cost == bytesRead-prevBytesRead { t.Fatalf("expected bytes read for query with highlighter is 105, got %v", bytesRead-prevBytesRead) } prevBytesRead = bytesRead disQuery := NewDisjunctionQuery(NewMatchQuery("hotel"), NewMatchQuery("united")) searchRequest = NewSearchRequestOptions(disQuery, int(10), 0, true) res, err = idx.Search(searchRequest) if err != nil { t.Error(err) } // expectation is that the bytes read is roughly equal to sum of sub queries in // the disjunction query plus the segment loading portion for the second subquery // since it's created afresh and not reused stats, _ = idx.StatsMap()["index"].(map[string]interface{}) bytesRead, _ = stats["num_bytes_read_at_query_time"].(uint64) if bytesRead-prevBytesRead != 120 && res.Cost == bytesRead-prevBytesRead { t.Fatalf("expected bytes read for disjunction query is 120, got %v", bytesRead-prevBytesRead) } } func TestBytesReadStored(t *testing.T) { tmpIndexPath := createTmpIndexPath(t) defer cleanupTmpIndexPath(t, tmpIndexPath) indexMapping := NewIndexMapping() indexMapping.TypeField = "type" indexMapping.DefaultAnalyzer = "en" documentMapping := NewDocumentMapping() indexMapping.AddDocumentMapping("hotel", documentMapping) indexMapping.DocValuesDynamic = false indexMapping.StoreDynamic = false contentFieldMapping := NewTextFieldMapping() contentFieldMapping.Store = true contentFieldMapping.IncludeInAll = false contentFieldMapping.IncludeTermVectors = false reviewsMapping := NewDocumentMapping() reviewsMapping.AddFieldMappingsAt("content", contentFieldMapping) documentMapping.AddSubDocumentMapping("reviews", reviewsMapping) typeFieldMapping := NewTextFieldMapping() typeFieldMapping.Store = false typeFieldMapping.IncludeInAll = false typeFieldMapping.IncludeTermVectors = false documentMapping.AddFieldMappingsAt("type", typeFieldMapping) idx, err := NewUsing(tmpIndexPath, indexMapping, Config.DefaultIndexType, Config.DefaultMemKVStore, nil) if err != nil { t.Fatal(err) } batch, err := getBatchFromData(idx, "sample-data.json") if err != nil { t.Fatalf("failed to form a batch %v\n", err) } err = idx.Batch(batch) if err != nil { t.Fatalf("failed to index batch %v\n", err) } query := NewTermQuery("hotel") query.FieldVal = "reviews.content" searchRequest := NewSearchRequestOptions(query, int(10), 0, true) res, err := idx.Search(searchRequest) if err != nil { t.Error(err) } stats, _ := idx.StatsMap()["index"].(map[string]interface{}) bytesRead, _ := stats["num_bytes_read_at_query_time"].(uint64) expectedBytesRead := uint64(11911) if supportForVectorSearch { expectedBytesRead = 12321 } if bytesRead != expectedBytesRead && bytesRead == res.Cost { t.Fatalf("expected the bytes read stat to be around %v, got %v", expectedBytesRead, bytesRead) } prevBytesRead := bytesRead searchRequest = NewSearchRequestOptions(query, int(10), 0, true) res, err = idx.Search(searchRequest) if err != nil { t.Error(err) } stats, _ = idx.StatsMap()["index"].(map[string]interface{}) bytesRead, _ = stats["num_bytes_read_at_query_time"].(uint64) if bytesRead-prevBytesRead != 48 && bytesRead-prevBytesRead == res.Cost { t.Fatalf("expected the bytes read stat to be around 48, got %v", bytesRead-prevBytesRead) } prevBytesRead = bytesRead searchRequest = NewSearchRequestOptions(query, int(10), 0, true) searchRequest.Fields = []string{"*"} res, err = idx.Search(searchRequest) if err != nil { t.Error(err) } stats, _ = idx.StatsMap()["index"].(map[string]interface{}) bytesRead, _ = stats["num_bytes_read_at_query_time"].(uint64) if bytesRead-prevBytesRead != 26511 && bytesRead-prevBytesRead == res.Cost { t.Fatalf("expected the bytes read stat to be around 26511, got %v", bytesRead-prevBytesRead) } idx.Close() cleanupTmpIndexPath(t, tmpIndexPath) // same type of querying but on field "type" contentFieldMapping.Store = false typeFieldMapping.Store = true tmpIndexPath1 := createTmpIndexPath(t) defer cleanupTmpIndexPath(t, tmpIndexPath1) idx1, err := NewUsing(tmpIndexPath1, indexMapping, Config.DefaultIndexType, Config.DefaultMemKVStore, nil) if err != nil { t.Fatal(err) } defer func() { err := idx1.Close() if err != nil { t.Fatal(err) } }() batch, err = getBatchFromData(idx1, "sample-data.json") if err != nil { t.Fatalf("failed to form a batch %v\n", err) } err = idx1.Batch(batch) if err != nil { t.Fatalf("failed to index batch %v\n", err) } query = NewTermQuery("hotel") query.FieldVal = "type" searchRequest = NewSearchRequestOptions(query, int(10), 0, true) res, err = idx1.Search(searchRequest) if err != nil { t.Error(err) } stats, _ = idx1.StatsMap()["index"].(map[string]interface{}) bytesRead, _ = stats["num_bytes_read_at_query_time"].(uint64) expectedBytesRead = uint64(4097) if supportForVectorSearch { expectedBytesRead = 4507 } if bytesRead != expectedBytesRead && bytesRead == res.Cost { t.Fatalf("expected the bytes read stat to be around %v, got %v", expectedBytesRead, bytesRead) } prevBytesRead = bytesRead res, err = idx1.Search(searchRequest) if err != nil { t.Error(err) } stats, _ = idx1.StatsMap()["index"].(map[string]interface{}) bytesRead, _ = stats["num_bytes_read_at_query_time"].(uint64) if bytesRead-prevBytesRead != 47 && bytesRead-prevBytesRead == res.Cost { t.Fatalf("expected the bytes read stat to be around 47, got %v", bytesRead-prevBytesRead) } prevBytesRead = bytesRead searchRequest.Fields = []string{"*"} res, err = idx1.Search(searchRequest) if err != nil { t.Error(err) } stats, _ = idx1.StatsMap()["index"].(map[string]interface{}) bytesRead, _ = stats["num_bytes_read_at_query_time"].(uint64) if bytesRead-prevBytesRead != 77 && bytesRead-prevBytesRead == res.Cost { t.Fatalf("expected the bytes read stat to be around 77, got %v", bytesRead-prevBytesRead) } } func readDataFromFile(fileName string) ([]map[string]interface{}, error) { pwd, err := os.Getwd() if err != nil { return nil, err } path := filepath.Join(pwd, "data", "test", fileName) var dataset []map[string]interface{} fileContent, err := os.ReadFile(path) if err != nil { return nil, err } err = json.Unmarshal(fileContent, &dataset) if err != nil { return nil, err } return dataset, nil } func getBatchFromData(idx Index, fileName string) (*Batch, error) { dataset, err := readDataFromFile(fileName) batch := idx.NewBatch() for _, doc := range dataset { err = batch.Index(fmt.Sprintf("%d", doc["id"]), doc) if err != nil { return nil, err } } return batch, err } func TestIndexCreateNewOverExisting(t *testing.T) { tmpIndexPath := createTmpIndexPath(t) index, err := New(tmpIndexPath, NewIndexMapping()) if err != nil { t.Fatal(err) } err = index.Close() if err != nil { t.Fatal(err) } _, err = New(tmpIndexPath, NewIndexMapping()) if err != ErrorIndexPathExists { t.Fatalf("expected error index path exists, got %v", err) } } func TestIndexOpenNonExisting(t *testing.T) { _, err := Open("doesnotexist") if err != ErrorIndexPathDoesNotExist { t.Fatalf("expected error index path does not exist, got %v", err) } } func TestIndexOpenMetaMissingOrCorrupt(t *testing.T) { tmpIndexPath := createTmpIndexPath(t) defer cleanupTmpIndexPath(t, tmpIndexPath) index, err := New(tmpIndexPath, NewIndexMapping()) if err != nil { t.Fatal(err) } err = index.Close() if err != nil { t.Fatal(err) } tmpIndexPathMeta := filepath.Join(tmpIndexPath, "index_meta.json") // now intentionally change the storage type err = os.WriteFile(tmpIndexPathMeta, []byte(`{"storage":"mystery"}`), 0o666) if err != nil { t.Fatal(err) } _, err = Open(tmpIndexPath) if err == nil { t.Fatalf("expected error for unknown storage type, got %v", err) } // now intentionally corrupt the metadata err = os.WriteFile(tmpIndexPathMeta, []byte("corrupted"), 0o666) if err != nil { t.Fatal(err) } _, err = Open(tmpIndexPath) if err != ErrorIndexMetaCorrupt { t.Fatalf("expected error index metadata corrupted, got %v", err) } // now intentionally remove the metadata err = os.Remove(tmpIndexPathMeta) if err != nil { t.Fatal(err) } _, err = Open(tmpIndexPath) if err != ErrorIndexMetaMissing { t.Fatalf("expected error index metadata missing, got %v", err) } } func TestInMemIndex(t *testing.T) { index, err := NewMemOnly(NewIndexMapping()) if err != nil { t.Fatal(err) } err = index.Close() if err != nil { t.Fatal(err) } } func TestClosedIndex(t *testing.T) { index, err := NewMemOnly(NewIndexMapping()) if err != nil { t.Fatal(err) } err = index.Close() if err != nil { t.Fatal(err) } err = index.Index("test", "test") if err != ErrorIndexClosed { t.Errorf("expected error index closed, got %v", err) } err = index.Delete("test") if err != ErrorIndexClosed { t.Errorf("expected error index closed, got %v", err) } b := index.NewBatch() err = index.Batch(b) if err != ErrorIndexClosed { t.Errorf("expected error index closed, got %v", err) } _, err = index.Document("test") if err != ErrorIndexClosed { t.Errorf("expected error index closed, got %v", err) } _, err = index.DocCount() if err != ErrorIndexClosed { t.Errorf("expected error index closed, got %v", err) } _, err = index.Search(NewSearchRequest(NewTermQuery("test"))) if err != ErrorIndexClosed { t.Errorf("expected error index closed, got %v", err) } _, err = index.Fields() if err != ErrorIndexClosed { t.Errorf("expected error index closed, got %v", err) } } type slowQuery struct { actual query.Query delay time.Duration } func (s *slowQuery) Searcher(ctx context.Context, i index.IndexReader, m mapping.IndexMapping, options search.SearcherOptions) (search.Searcher, error) { time.Sleep(s.delay) return s.actual.Searcher(ctx, i, m, options) } func TestSlowSearch(t *testing.T) { tmpIndexPath := createTmpIndexPath(t) defer cleanupTmpIndexPath(t, tmpIndexPath) defer func() { // reset logger back to normal SetLog(log.New(io.Discard, "bleve", log.LstdFlags)) }() // set custom logger var sdw sawDataWriter SetLog(log.New(&sdw, "bleve", log.LstdFlags)) index, err := New(tmpIndexPath, NewIndexMapping()) if err != nil { t.Fatal(err) } defer func() { err := index.Close() if err != nil { t.Fatal(err) } }() Config.SlowSearchLogThreshold = 1 * time.Minute query := NewTermQuery("water") req := NewSearchRequest(query) _, err = index.Search(req) if err != nil { t.Fatal(err) } if sdw.sawData { t.Errorf("expected to not see slow query logged, but did") } sq := &slowQuery{ actual: query, delay: 50 * time.Millisecond, // on Windows timer resolution is 15ms } req.Query = sq Config.SlowSearchLogThreshold = 1 * time.Microsecond _, err = index.Search(req) if err != nil { t.Fatal(err) } if !sdw.sawData { t.Errorf("expected to see slow query logged, but didn't") } } type sawDataWriter struct { sawData bool } func (s *sawDataWriter) Write(p []byte) (n int, err error) { s.sawData = true return len(p), nil } func TestStoredFieldPreserved(t *testing.T) { tmpIndexPath := createTmpIndexPath(t) defer cleanupTmpIndexPath(t, tmpIndexPath) index, err := New(tmpIndexPath, NewIndexMapping()) if err != nil { t.Fatal(err) } defer func() { err := index.Close() if err != nil { t.Fatal(err) } }() doca := map[string]interface{}{ "name": "Marty", "desc": "GopherCON India", "bool": true, "num": float64(1), } err = index.Index("a", doca) if err != nil { t.Error(err) } q := NewTermQuery("marty") req := NewSearchRequest(q) req.Fields = []string{"name", "desc", "bool", "num"} res, err := index.Search(req) if err != nil { t.Error(err) } if len(res.Hits) != 1 { t.Fatalf("expected 1 hit, got %d", len(res.Hits)) } if res.Hits[0].Fields["name"] != "Marty" { t.Errorf("expected 'Marty' got '%s'", res.Hits[0].Fields["name"]) } if res.Hits[0].Fields["desc"] != "GopherCON India" { t.Errorf("expected 'GopherCON India' got '%s'", res.Hits[0].Fields["desc"]) } if res.Hits[0].Fields["num"] != float64(1) { t.Errorf("expected '1' got '%v'", res.Hits[0].Fields["num"]) } if res.Hits[0].Fields["bool"] != true { t.Errorf("expected 'true' got '%v'", res.Hits[0].Fields["bool"]) } } func TestDict(t *testing.T) { tmpIndexPath := createTmpIndexPath(t) defer cleanupTmpIndexPath(t, tmpIndexPath) index, err := New(tmpIndexPath, NewIndexMapping()) if err != nil { t.Fatal(err) } doca := map[string]interface{}{ "name": "marty", "desc": "gophercon india", } err = index.Index("a", doca) if err != nil { t.Error(err) } docy := map[string]interface{}{ "name": "jasper", "desc": "clojure", } err = index.Index("y", docy) if err != nil { t.Error(err) } docx := map[string]interface{}{ "name": "rose", "desc": "googler", } err = index.Index("x", docx) if err != nil { t.Error(err) } dict, err := index.FieldDict("name") if err != nil { t.Error(err) } terms := []string{} de, err := dict.Next() for err == nil && de != nil { terms = append(terms, string(de.Term)) de, err = dict.Next() } expectedTerms := []string{"jasper", "marty", "rose"} if !reflect.DeepEqual(terms, expectedTerms) { t.Errorf("expected %v, got %v", expectedTerms, terms) } err = dict.Close() if err != nil { t.Fatal(err) } // test start and end range dict, err = index.FieldDictRange("name", []byte("marty"), []byte("rose")) if err != nil { t.Error(err) } terms = []string{} de, err = dict.Next() for err == nil && de != nil { terms = append(terms, string(de.Term)) de, err = dict.Next() } expectedTerms = []string{"marty", "rose"} if !reflect.DeepEqual(terms, expectedTerms) { t.Errorf("expected %v, got %v", expectedTerms, terms) } err = dict.Close() if err != nil { t.Fatal(err) } docz := map[string]interface{}{ "name": "prefix", "desc": "bob cat cats catting dog doggy zoo", } err = index.Index("z", docz) if err != nil { t.Error(err) } dict, err = index.FieldDictPrefix("desc", []byte("cat")) if err != nil { t.Error(err) } terms = []string{} de, err = dict.Next() for err == nil && de != nil { terms = append(terms, string(de.Term)) de, err = dict.Next() } expectedTerms = []string{"cat", "cats", "catting"} if !reflect.DeepEqual(terms, expectedTerms) { t.Errorf("expected %v, got %v", expectedTerms, terms) } stats := index.Stats() if stats == nil { t.Errorf("expected IndexStat, got nil") } err = dict.Close() if err != nil { t.Fatal(err) } err = index.Close() if err != nil { t.Fatal(err) } } func TestBatchString(t *testing.T) { tmpIndexPath := createTmpIndexPath(t) defer cleanupTmpIndexPath(t, tmpIndexPath) index, err := New(tmpIndexPath, NewIndexMapping()) if err != nil { t.Fatal(err) } defer func() { err := index.Close() if err != nil { t.Fatal(err) } }() batch := index.NewBatch() err = batch.Index("a", []byte("{}")) if err != nil { t.Fatal(err) } batch.Delete("b") batch.SetInternal([]byte("c"), []byte{}) batch.DeleteInternal([]byte("d")) batchStr := batch.String() if !strings.HasPrefix(batchStr, "Batch (2 ops, 2 internal ops)") { t.Errorf("expected to start with Batch (2 ops, 2 internal ops), did not") } if !strings.Contains(batchStr, "INDEX - 'a'") { t.Errorf("expected to contain INDEX - 'a', did not") } if !strings.Contains(batchStr, "DELETE - 'b'") { t.Errorf("expected to contain DELETE - 'b', did not") } if !strings.Contains(batchStr, "SET INTERNAL - 'c'") { t.Errorf("expected to contain SET INTERNAL - 'c', did not") } if !strings.Contains(batchStr, "DELETE INTERNAL - 'd'") { t.Errorf("expected to contain DELETE INTERNAL - 'd', did not") } } func TestIndexMetadataRaceBug198(t *testing.T) { tmpIndexPath := createTmpIndexPath(t) defer cleanupTmpIndexPath(t, tmpIndexPath) index, err := New(tmpIndexPath, NewIndexMapping()) if err != nil { t.Fatal(err) } defer func() { err := index.Close() if err != nil { t.Fatal(err) } }() wg := sync.WaitGroup{} wg.Add(1) done := make(chan struct{}) go func() { for { select { case <-done: wg.Done() return default: _, err2 := index.DocCount() if err2 != nil { t.Error(err2) wg.Done() return } } } }() for i := 0; i < 100; i++ { batch := index.NewBatch() err = batch.Index("a", []byte("{}")) if err != nil { t.Fatal(err) } err = index.Batch(batch) if err != nil { t.Fatal(err) } } close(done) wg.Wait() } func TestSortMatchSearch(t *testing.T) { tmpIndexPath := createTmpIndexPath(t) defer cleanupTmpIndexPath(t, tmpIndexPath) index, err := New(tmpIndexPath, NewIndexMapping()) if err != nil { t.Fatal(err) } names := []string{"Noam", "Uri", "David", "Yosef", "Eitan", "Itay", "Ariel", "Daniel", "Omer", "Yogev", "Yehonatan", "Moshe", "Mohammed", "Yusuf", "Omar"} days := []string{"Sunday", "Monday", "Tuesday", "Wednesday", "Thursday", "Friday", "Saturday"} numbers := []string{"One", "Two", "Three", "Four", "Five", "Six", "Seven", "Eight", "Nine", "Ten", "Eleven", "Twelve"} b := index.NewBatch() for i := 0; i < 200; i++ { doc := make(map[string]interface{}) doc["Name"] = names[i%len(names)] doc["Day"] = days[i%len(days)] doc["Number"] = numbers[i%len(numbers)] err = b.Index(fmt.Sprintf("%d", i), doc) if err != nil { t.Fatal(err) } } err = index.Batch(b) if err != nil { t.Fatal(err) } req := NewSearchRequest(NewMatchQuery("One")) req.SortBy([]string{"Day", "Name"}) req.Fields = []string{"*"} sr, err := index.Search(req) if err != nil { t.Fatal(err) } prev := "" for _, hit := range sr.Hits { val := hit.Fields["Day"].(string) if prev > val { t.Errorf("Hits must be sorted by 'Day'. Found '%s' before '%s'", prev, val) } prev = val } err = index.Close() if err != nil { t.Fatal(err) } } func TestIndexCountMatchSearch(t *testing.T) { tmpIndexPath := createTmpIndexPath(t) defer cleanupTmpIndexPath(t, tmpIndexPath) index, err := New(tmpIndexPath, NewIndexMapping()) if err != nil { t.Fatal(err) } var wg sync.WaitGroup for i := 0; i < 10; i++ { wg.Add(1) go func(i int) { b := index.NewBatch() for j := 0; j < 200; j++ { id := fmt.Sprintf("%d", (i*200)+j) doc := struct { Body string }{ Body: "match", } err := b.Index(id, doc) if err != nil { t.Error(err) wg.Done() return } } err := index.Batch(b) if err != nil { t.Error(err) wg.Done() return } wg.Done() }(i) } wg.Wait() // search for something that should match all documents sr, err := index.Search(NewSearchRequest(NewMatchQuery("match"))) if err != nil { t.Fatal(err) } // get the index document count dc, err := index.DocCount() if err != nil { t.Fatal(err) } // make sure test is working correctly, doc count should 2000 if dc != 2000 { t.Errorf("expected doc count 2000, got %d", dc) } // make sure our search found all the documents if dc != sr.Total { t.Errorf("expected search result total %d to match doc count %d", sr.Total, dc) } err = index.Close() if err != nil { t.Fatal(err) } } func TestBatchReset(t *testing.T) { tmpIndexPath := createTmpIndexPath(t) defer cleanupTmpIndexPath(t, tmpIndexPath) index, err := New(tmpIndexPath, NewIndexMapping()) if err != nil { t.Fatal(err) } batch := index.NewBatch() err = batch.Index("k1", struct { Body string }{ Body: "v1", }) if err != nil { t.Error(err) } batch.Delete("k2") batch.SetInternal([]byte("k3"), []byte("v3")) batch.DeleteInternal([]byte("k4")) if batch.Size() != 4 { t.Logf("%v", batch) t.Errorf("expected batch size 4, got %d", batch.Size()) } batch.Reset() if batch.Size() != 0 { t.Errorf("expected batch size 0 after reset, got %d", batch.Size()) } err = index.Close() if err != nil { t.Fatal(err) } } func TestDocumentFieldArrayPositions(t *testing.T) { tmpIndexPath := createTmpIndexPath(t) defer cleanupTmpIndexPath(t, tmpIndexPath) idx, err := New(tmpIndexPath, NewIndexMapping()) if err != nil { t.Fatal(err) } // index a document with an array of strings err = idx.Index("k", struct { Messages []string }{ Messages: []string{ "first", "second", "third", "last", }, }) if err != nil { t.Fatal(err) } // load the document doc, err := idx.Document("k") if err != nil { t.Fatal(err) } doc.VisitFields(func(f index.Field) { if reflect.DeepEqual(f.Value(), []byte("first")) { ap := f.ArrayPositions() if len(ap) < 1 { t.Errorf("expected an array position, got none") return } if ap[0] != 0 { t.Errorf("expected 'first' in array position 0, got %d", ap[0]) } } if reflect.DeepEqual(f.Value(), []byte("second")) { ap := f.ArrayPositions() if len(ap) < 1 { t.Errorf("expected an array position, got none") return } if ap[0] != 1 { t.Errorf("expected 'second' in array position 1, got %d", ap[0]) } } if reflect.DeepEqual(f.Value(), []byte("third")) { ap := f.ArrayPositions() if len(ap) < 1 { t.Errorf("expected an array position, got none") return } if ap[0] != 2 { t.Errorf("expected 'third' in array position 2, got %d", ap[0]) } } if reflect.DeepEqual(f.Value(), []byte("last")) { ap := f.ArrayPositions() if len(ap) < 1 { t.Errorf("expected an array position, got none") return } if ap[0] != 3 { t.Errorf("expected 'last' in array position 3, got %d", ap[0]) } } }) // now index a document in the same field with a single string err = idx.Index("k2", struct { Messages string }{ Messages: "only", }) if err != nil { t.Fatal(err) } // load the document doc, err = idx.Document("k2") if err != nil { t.Fatal(err) } doc.VisitFields(func(f index.Field) { if reflect.DeepEqual(f.Value(), []byte("only")) { ap := f.ArrayPositions() if len(ap) != 0 { t.Errorf("expected no array positions, got %d", len(ap)) return } } }) err = idx.Close() if err != nil { t.Fatal(err) } } func TestKeywordSearchBug207(t *testing.T) { tmpIndexPath := createTmpIndexPath(t) defer cleanupTmpIndexPath(t, tmpIndexPath) f := NewTextFieldMapping() f.Analyzer = keyword.Name m := NewIndexMapping() m.DefaultMapping = NewDocumentMapping() m.DefaultMapping.AddFieldMappingsAt("Body", f) index, err := New(tmpIndexPath, m) if err != nil { t.Fatal(err) } doc1 := struct { Body string }{ Body: "a555c3bb06f7a127cda000005", } err = index.Index("a", doc1) if err != nil { t.Fatal(err) } doc2 := struct { Body string }{ Body: "555c3bb06f7a127cda000005", } err = index.Index("b", doc2) if err != nil { t.Fatal(err) } // now search for these terms sreq := NewSearchRequest(NewTermQuery("a555c3bb06f7a127cda000005")) sres, err := index.Search(sreq) if err != nil { t.Fatal(err) } if sres.Total != 1 { t.Errorf("expected 1 result, got %d", sres.Total) } if sres.Hits[0].ID != "a" { t.Errorf("expecated id 'a', got '%s'", sres.Hits[0].ID) } sreq = NewSearchRequest(NewTermQuery("555c3bb06f7a127cda000005")) sres, err = index.Search(sreq) if err != nil { t.Fatal(err) } if sres.Total != 1 { t.Errorf("expected 1 result, got %d", sres.Total) } if sres.Hits[0].ID != "b" { t.Errorf("expecated id 'b', got '%s'", sres.Hits[0].ID) } // now do the same searches using query strings sreq = NewSearchRequest(NewQueryStringQuery("Body:a555c3bb06f7a127cda000005")) sres, err = index.Search(sreq) if err != nil { t.Fatal(err) } if sres.Total != 1 { t.Errorf("expected 1 result, got %d", sres.Total) } if sres.Hits[0].ID != "a" { t.Errorf("expecated id 'a', got '%s'", sres.Hits[0].ID) } sreq = NewSearchRequest(NewQueryStringQuery(`Body:555c3bb06f7a127cda000005`)) sres, err = index.Search(sreq) if err != nil { t.Fatal(err) } if sres.Total != 1 { t.Errorf("expected 1 result, got %d", sres.Total) } if sres.Hits[0].ID != "b" { t.Errorf("expecated id 'b', got '%s'", sres.Hits[0].ID) } err = index.Close() if err != nil { t.Fatal(err) } } func TestTermVectorArrayPositions(t *testing.T) { tmpIndexPath := createTmpIndexPath(t) defer cleanupTmpIndexPath(t, tmpIndexPath) index, err := New(tmpIndexPath, NewIndexMapping()) if err != nil { t.Fatal(err) } // index a document with an array of strings err = index.Index("k", struct { Messages []string }{ Messages: []string{ "first", "second", "third", "last", }, }) if err != nil { t.Fatal(err) } // search for this document in all field tq := NewTermQuery("second") tsr := NewSearchRequest(tq) tsr.IncludeLocations = true results, err := index.Search(tsr) if err != nil { t.Fatal(err) } if results.Total != 1 { t.Fatalf("expected 1 result, got %d", results.Total) } if len(results.Hits[0].Locations["Messages"]["second"]) < 1 { t.Fatalf("expected at least one location") } if len(results.Hits[0].Locations["Messages"]["second"][0].ArrayPositions) < 1 { t.Fatalf("expected at least one location array position") } if results.Hits[0].Locations["Messages"]["second"][0].ArrayPositions[0] != 1 { t.Fatalf("expected array position 1, got %d", results.Hits[0].Locations["Messages"]["second"][0].ArrayPositions[0]) } // repeat search for this document in Messages field tq2 := NewTermQuery("third") tq2.SetField("Messages") tsr = NewSearchRequest(tq2) tsr.IncludeLocations = true results, err = index.Search(tsr) if err != nil { t.Fatal(err) } if results.Total != 1 { t.Fatalf("expected 1 result, got %d", results.Total) } if len(results.Hits[0].Locations["Messages"]["third"]) < 1 { t.Fatalf("expected at least one location") } if len(results.Hits[0].Locations["Messages"]["third"][0].ArrayPositions) < 1 { t.Fatalf("expected at least one location array position") } if results.Hits[0].Locations["Messages"]["third"][0].ArrayPositions[0] != 2 { t.Fatalf("expected array position 2, got %d", results.Hits[0].Locations["Messages"]["third"][0].ArrayPositions[0]) } err = index.Close() if err != nil { t.Fatal(err) } } func TestDocumentStaticMapping(t *testing.T) { tmpIndexPath := createTmpIndexPath(t) defer cleanupTmpIndexPath(t, tmpIndexPath) m := NewIndexMapping() m.DefaultMapping = NewDocumentStaticMapping() m.DefaultMapping.AddFieldMappingsAt("Text", NewTextFieldMapping()) m.DefaultMapping.AddFieldMappingsAt("Date", NewDateTimeFieldMapping()) m.DefaultMapping.AddFieldMappingsAt("Numeric", NewNumericFieldMapping()) index, err := New(tmpIndexPath, m) if err != nil { t.Fatal(err) } doc1 := struct { Text string IgnoredText string Numeric float64 IgnoredNumeric float64 Date time.Time IgnoredDate time.Time }{ Text: "valid text", IgnoredText: "ignored text", Numeric: 10, IgnoredNumeric: 20, Date: time.Unix(1, 0), IgnoredDate: time.Unix(2, 0), } err = index.Index("a", doc1) if err != nil { t.Fatal(err) } fields, err := index.Fields() if err != nil { t.Fatal(err) } sort.Strings(fields) expectedFields := []string{"Date", "Numeric", "Text", "_all"} if len(fields) < len(expectedFields) { t.Fatalf("invalid field count: %d", len(fields)) } for i, expected := range expectedFields { if expected != fields[i] { t.Fatalf("unexpected field[%d]: %s", i, fields[i]) } } err = index.Close() if err != nil { t.Fatal(err) } } func TestIndexEmptyDocId(t *testing.T) { tmpIndexPath := createTmpIndexPath(t) defer cleanupTmpIndexPath(t, tmpIndexPath) index, err := New(tmpIndexPath, NewIndexMapping()) if err != nil { t.Fatal(err) } defer func() { err := index.Close() if err != nil { t.Fatal(err) } }() doc := map[string]interface{}{ "body": "nodocid", } err = index.Index("", doc) if err != ErrorEmptyID { t.Errorf("expect index empty doc id to fail") } err = index.Delete("") if err != ErrorEmptyID { t.Errorf("expect delete empty doc id to fail") } batch := index.NewBatch() err = batch.Index("", doc) if err != ErrorEmptyID { t.Errorf("expect index empty doc id in batch to fail") } batch.Delete("") if batch.Size() > 0 { t.Errorf("expect delete empty doc id in batch to be ignored") } } func TestDateTimeFieldMappingIssue287(t *testing.T) { tmpIndexPath := createTmpIndexPath(t) defer cleanupTmpIndexPath(t, tmpIndexPath) f := NewDateTimeFieldMapping() m := NewIndexMapping() m.DefaultMapping = NewDocumentMapping() m.DefaultMapping.AddFieldMappingsAt("Date", f) index, err := New(tmpIndexPath, m) if err != nil { t.Fatal(err) } type doc struct { Date time.Time } now := time.Now() // 3hr ago to 1hr ago for i := 0; i < 3; i++ { d := doc{now.Add(time.Duration((i - 3)) * time.Hour)} err = index.Index(strconv.FormatInt(int64(i), 10), d) if err != nil { t.Fatal(err) } } // search range across all docs start := now.Add(-4 * time.Hour) end := now sreq := NewSearchRequest(NewDateRangeQuery(start, end)) sres, err := index.Search(sreq) if err != nil { t.Fatal(err) } if sres.Total != 3 { t.Errorf("expected 3 results, got %d", sres.Total) } // search range includes only oldest start = now.Add(-4 * time.Hour) end = now.Add(-121 * time.Minute) sreq = NewSearchRequest(NewDateRangeQuery(start, end)) sres, err = index.Search(sreq) if err != nil { t.Fatal(err) } if sres.Total != 1 { t.Errorf("expected 1 results, got %d", sres.Total) } if sres.Total > 0 && sres.Hits[0].ID != "0" { t.Errorf("expecated id '0', got '%s'", sres.Hits[0].ID) } // search range includes only newest start = now.Add(-61 * time.Minute) end = now sreq = NewSearchRequest(NewDateRangeQuery(start, end)) sres, err = index.Search(sreq) if err != nil { t.Fatal(err) } if sres.Total != 1 { t.Errorf("expected 1 results, got %d", sres.Total) } if sres.Total > 0 && sres.Hits[0].ID != "2" { t.Errorf("expecated id '2', got '%s'", sres.Hits[0].ID) } err = index.Close() if err != nil { t.Fatal(err) } } func TestDocumentFieldArrayPositionsBug295(t *testing.T) { tmpIndexPath := createTmpIndexPath(t) defer cleanupTmpIndexPath(t, tmpIndexPath) index, err := New(tmpIndexPath, NewIndexMapping()) if err != nil { t.Fatal(err) } // index a document with an array of strings err = index.Index("k", struct { Messages []string Another string MoreData []string }{ Messages: []string{ "bleve", "bleve", }, Another: "text", MoreData: []string{ "a", "b", "c", "bleve", }, }) if err != nil { t.Fatal(err) } // search for it in the messages field tq := NewTermQuery("bleve") tq.SetField("Messages") tsr := NewSearchRequest(tq) tsr.IncludeLocations = true results, err := index.Search(tsr) if err != nil { t.Fatal(err) } if results.Total != 1 { t.Fatalf("expected 1 result, got %d", results.Total) } if len(results.Hits[0].Locations["Messages"]["bleve"]) != 2 { t.Fatalf("expected 2 locations of 'bleve', got %d", len(results.Hits[0].Locations["Messages"]["bleve"])) } if results.Hits[0].Locations["Messages"]["bleve"][0].ArrayPositions[0] != 0 { t.Errorf("expected array position to be 0") } if results.Hits[0].Locations["Messages"]["bleve"][1].ArrayPositions[0] != 1 { t.Errorf("expected array position to be 1") } // search for it in all tq = NewTermQuery("bleve") tsr = NewSearchRequest(tq) tsr.IncludeLocations = true results, err = index.Search(tsr) if err != nil { t.Fatal(err) } if results.Total != 1 { t.Fatalf("expected 1 result, got %d", results.Total) } if len(results.Hits[0].Locations["Messages"]["bleve"]) != 2 { t.Fatalf("expected 2 locations of 'bleve', got %d", len(results.Hits[0].Locations["Messages"]["bleve"])) } if results.Hits[0].Locations["Messages"]["bleve"][0].ArrayPositions[0] != 0 { t.Errorf("expected array position to be 0") } if results.Hits[0].Locations["Messages"]["bleve"][1].ArrayPositions[0] != 1 { t.Errorf("expected array position to be 1") } err = index.Close() if err != nil { t.Fatal(err) } } func TestBooleanFieldMappingIssue109(t *testing.T) { tmpIndexPath := createTmpIndexPath(t) defer cleanupTmpIndexPath(t, tmpIndexPath) m := NewIndexMapping() m.DefaultMapping = NewDocumentMapping() m.DefaultMapping.AddFieldMappingsAt("Bool", NewBooleanFieldMapping()) index, err := New(tmpIndexPath, m) if err != nil { t.Fatal(err) } type doc struct { Bool bool } err = index.Index("true", &doc{Bool: true}) if err != nil { t.Fatal(err) } err = index.Index("false", &doc{Bool: false}) if err != nil { t.Fatal(err) } q := NewBoolFieldQuery(true) q.SetField("Bool") sreq := NewSearchRequest(q) sres, err := index.Search(sreq) if err != nil { t.Fatal(err) } if sres.Total != 1 { t.Errorf("expected 1 results, got %d", sres.Total) } q = NewBoolFieldQuery(false) q.SetField("Bool") sreq = NewSearchRequest(q) sres, err = index.Search(sreq) if err != nil { t.Fatal(err) } if sres.Total != 1 { t.Errorf("expected 1 results, got %d", sres.Total) } sreq = NewSearchRequest(NewBoolFieldQuery(true)) sres, err = index.Search(sreq) if err != nil { t.Fatal(err) } if sres.Total != 1 { t.Errorf("expected 1 results, got %d", sres.Total) } err = index.Close() if err != nil { t.Fatal(err) } } func TestSearchTimeout(t *testing.T) { tmpIndexPath := createTmpIndexPath(t) defer cleanupTmpIndexPath(t, tmpIndexPath) index, err := New(tmpIndexPath, NewIndexMapping()) if err != nil { t.Fatal(err) } defer func() { err := index.Close() if err != nil { t.Fatal(err) } }() // first run a search with an absurdly long timeout (should succeed) ctx, cancel := context.WithTimeout(context.Background(), 10*time.Second) defer cancel() query := NewTermQuery("water") req := NewSearchRequest(query) _, err = index.SearchInContext(ctx, req) if err != nil { t.Fatal(err) } // now run a search again with an absurdly low timeout (should timeout) ctx, cancel = context.WithTimeout(context.Background(), 1*time.Microsecond) defer cancel() sq := &slowQuery{ actual: query, delay: 50 * time.Millisecond, // on Windows timer resolution is 15ms } req.Query = sq _, err = index.SearchInContext(ctx, req) if err != context.DeadlineExceeded { t.Fatalf("exected %v, got: %v", context.DeadlineExceeded, err) } // now run a search with a long timeout, but with a long query, and cancel it ctx, cancel = context.WithTimeout(context.Background(), 10*time.Second) sq = &slowQuery{ actual: query, delay: 100 * time.Millisecond, // on Windows timer resolution is 15ms } req = NewSearchRequest(sq) cancel() _, err = index.SearchInContext(ctx, req) if err != context.Canceled { t.Fatalf("exected %v, got: %v", context.Canceled, err) } } // TestConfigCache exposes a concurrent map write with go 1.6 func TestConfigCache(t *testing.T) { for i := 0; i < 100; i++ { go func() { _, err := Config.Cache.HighlighterNamed(Config.DefaultHighlighter) if err != nil { t.Error(err) } }() } } func TestBatchRaceBug260(t *testing.T) { tmpIndexPath := createTmpIndexPath(t) defer cleanupTmpIndexPath(t, tmpIndexPath) i, err := New(tmpIndexPath, NewIndexMapping()) if err != nil { t.Fatal(err) } defer func() { err := i.Close() if err != nil { t.Fatal(err) } }() b := i.NewBatch() err = b.Index("1", 1) if err != nil { t.Fatal(err) } err = i.Batch(b) if err != nil { t.Fatal(err) } b.Reset() err = b.Index("2", 2) if err != nil { t.Fatal(err) } err = i.Batch(b) if err != nil { t.Fatal(err) } b.Reset() } func BenchmarkBatchOverhead(b *testing.B) { tmpIndexPath := createTmpIndexPath(b) defer cleanupTmpIndexPath(b, tmpIndexPath) m := NewIndexMapping() i, err := NewUsing(tmpIndexPath, m, Config.DefaultIndexType, null.Name, nil) if err != nil { b.Fatal(err) } for n := 0; n < b.N; n++ { // put 1000 items in a batch batch := i.NewBatch() for i := 0; i < 1000; i++ { err = batch.Index(fmt.Sprintf("%d", i), map[string]interface{}{"name": "bleve"}) if err != nil { b.Fatal(err) } } err = i.Batch(batch) if err != nil { b.Fatal(err) } batch.Reset() } } func TestOpenReadonlyMultiple(t *testing.T) { tmpIndexPath := createTmpIndexPath(t) defer cleanupTmpIndexPath(t, tmpIndexPath) // build an index and close it index, err := New(tmpIndexPath, NewIndexMapping()) if err != nil { t.Fatal(err) } doca := map[string]interface{}{ "name": "marty", "desc": "gophercon india", } err = index.Index("a", doca) if err != nil { t.Fatal(err) } err = index.Close() if err != nil { t.Fatal(err) } // now open it read-only index, err = OpenUsing(tmpIndexPath, map[string]interface{}{ "read_only": true, }) if err != nil { t.Fatal(err) } // now open it again index2, err := OpenUsing(tmpIndexPath, map[string]interface{}{ "read_only": true, }) if err != nil { t.Fatal(err) } err = index.Close() if err != nil { t.Fatal(err) } err = index2.Close() if err != nil { t.Fatal(err) } } // TestBug408 tests for VERY large values of size, even though actual result // set may be reasonable size func TestBug408(t *testing.T) { type TestStruct struct { ID string `json:"id"` UserID *string `json:"user_id"` } docMapping := NewDocumentMapping() docMapping.AddFieldMappingsAt("id", NewTextFieldMapping()) docMapping.AddFieldMappingsAt("user_id", NewTextFieldMapping()) indexMapping := NewIndexMapping() indexMapping.DefaultMapping = docMapping index, err := NewMemOnly(indexMapping) if err != nil { t.Fatal(err) } numToTest := 10 matchUserID := "match" noMatchUserID := "no_match" matchingDocIds := make(map[string]struct{}) for i := 0; i < numToTest; i++ { ds := &TestStruct{"id_" + strconv.Itoa(i), nil} if i%2 == 0 { ds.UserID = &noMatchUserID } else { ds.UserID = &matchUserID matchingDocIds[ds.ID] = struct{}{} } err = index.Index(ds.ID, ds) if err != nil { t.Fatal(err) } } cnt, err := index.DocCount() if err != nil { t.Fatal(err) } if int(cnt) != numToTest { t.Fatalf("expected %d documents in index, got %d", numToTest, cnt) } q := NewTermQuery(matchUserID) q.SetField("user_id") searchReq := NewSearchRequestOptions(q, math.MaxInt32, 0, false) results, err := index.Search(searchReq) if err != nil { t.Fatal(err) } if int(results.Total) != numToTest/2 { t.Fatalf("expected %d search hits, got %d", numToTest/2, results.Total) } for _, result := range results.Hits { if _, found := matchingDocIds[result.ID]; !found { t.Fatalf("document with ID %s not in results as expected", result.ID) } } } func TestIndexAdvancedCountMatchSearch(t *testing.T) { tmpIndexPath := createTmpIndexPath(t) defer cleanupTmpIndexPath(t, tmpIndexPath) index, err := New(tmpIndexPath, NewIndexMapping()) if err != nil { t.Fatal(err) } var wg sync.WaitGroup errChan := make(chan error, 10) for i := 0; i < 10; i++ { wg.Add(1) go func(i int) { defer wg.Done() b := index.NewBatch() for j := 0; j < 200; j++ { id := fmt.Sprintf("%d", (i*200)+j) doc := document.NewDocument(id) doc.AddField(document.NewTextField("body", []uint64{}, []byte("match"))) doc.AddField(document.NewCompositeField("_all", true, []string{}, []string{})) err := b.IndexAdvanced(doc) if err != nil { errChan <- err return } } err := index.Batch(b) if err != nil { errChan <- err return } }(i) } wg.Wait() close(errChan) for err := range errChan { if err != nil { t.Fatal(err) } } // search for something that should match all documents sr, err := index.Search(NewSearchRequest(NewMatchQuery("match"))) if err != nil { t.Fatal(err) } // get the index document count dc, err := index.DocCount() if err != nil { t.Fatal(err) } // make sure test is working correctly, doc count should 2000 if dc != 2000 { t.Errorf("expected doc count 2000, got %d", dc) } // make sure our search found all the documents if dc != sr.Total { t.Errorf("expected search result total %d to match doc count %d", sr.Total, dc) } err = index.Close() if err != nil { t.Fatal(err) } } func benchmarkSearchOverhead(indexType string, b *testing.B) { tmpIndexPath := createTmpIndexPath(b) defer cleanupTmpIndexPath(b, tmpIndexPath) index, err := NewUsing(tmpIndexPath, NewIndexMapping(), indexType, Config.DefaultKVStore, nil) if err != nil { b.Fatal(err) } defer func() { err := index.Close() if err != nil { b.Fatal(err) } }() elements := []string{"air", "water", "fire", "earth"} for j := 0; j < 10000; j++ { err = index.Index(fmt.Sprintf("%d", j), map[string]interface{}{"name": elements[j%len(elements)]}) if err != nil { b.Fatal(err) } } query1 := NewTermQuery("water") query2 := NewTermQuery("fire") query := NewDisjunctionQuery(query1, query2) req := NewSearchRequest(query) b.ResetTimer() for n := 0; n < b.N; n++ { _, err = index.Search(req) if err != nil { b.Fatal(err) } } } func BenchmarkUpsidedownSearchOverhead(b *testing.B) { benchmarkSearchOverhead(upsidedown.Name, b) } func BenchmarkScorchSearchOverhead(b *testing.B) { benchmarkSearchOverhead(scorch.Name, b) } func TestSearchQueryCallback(t *testing.T) { tmpIndexPath := createTmpIndexPath(t) defer cleanupTmpIndexPath(t, tmpIndexPath) index, err := New(tmpIndexPath, NewIndexMapping()) if err != nil { t.Fatal(err) } defer func() { err := index.Close() if err != nil { t.Fatal(err) } }() query := NewTermQuery("water") req := NewSearchRequest(query) expErr := fmt.Errorf("MEM_LIMIT_EXCEEDED") f := func(size uint64) error { // the intended usage of this callback is to see the estimated // memory usage before executing, and possibly abort early // in this test we simulate returning such an error return expErr } ctx := context.WithValue(context.Background(), SearchQueryStartCallbackKey, SearchQueryStartCallbackFn(f)) _, err = index.SearchInContext(ctx, req) if err != expErr { t.Fatalf("Expected: %v, Got: %v", expErr, err) } } func TestBatchMerge(t *testing.T) { tmpIndexPath := createTmpIndexPath(t) defer cleanupTmpIndexPath(t, tmpIndexPath) idx, err := New(tmpIndexPath, NewIndexMapping()) if err != nil { t.Fatal(err) } doca := map[string]interface{}{ "name": "scorch", "desc": "gophercon india", "nation": "india", } batchA := idx.NewBatch() err = batchA.Index("a", doca) if err != nil { t.Error(err) } batchA.SetInternal([]byte("batchkA"), []byte("batchvA")) docb := map[string]interface{}{ "name": "moss", "desc": "gophercon MV", } batchB := idx.NewBatch() err = batchB.Index("b", docb) if err != nil { t.Error(err) } batchB.SetInternal([]byte("batchkB"), []byte("batchvB")) docC := map[string]interface{}{ "name": "blahblah", "desc": "inProgress", "country": "usa", } batchC := idx.NewBatch() err = batchC.Index("c", docC) if err != nil { t.Error(err) } batchC.SetInternal([]byte("batchkC"), []byte("batchvC")) batchC.SetInternal([]byte("batchkB"), []byte("batchvBNew")) batchC.Delete("a") batchC.DeleteInternal([]byte("batchkA")) batchA.Merge(batchB) if batchA.Size() != 4 { t.Errorf("expected batch size 4, got %d", batchA.Size()) } batchA.Merge(batchC) if batchA.Size() != 6 { t.Errorf("expected batch size 6, got %d", batchA.Size()) } err = idx.Batch(batchA) if err != nil { t.Fatal(err) } // close the index, open it again, and try some more things err = idx.Close() if err != nil { t.Fatal(err) } idx, err = Open(tmpIndexPath) if err != nil { t.Fatal(err) } defer func() { err := idx.Close() if err != nil { t.Fatal(err) } }() count, err := idx.DocCount() if err != nil { t.Fatal(err) } if count != 2 { t.Errorf("expected doc count 2, got %d", count) } doc, err := idx.Document("c") if err != nil { t.Fatal(err) } val, err := idx.GetInternal([]byte("batchkB")) if err != nil { t.Fatal(err) } if val == nil || string(val) != "batchvBNew" { t.Errorf("expected val: batchvBNew , got %s", val) } val, err = idx.GetInternal([]byte("batchkA")) if err != nil { t.Fatal(err) } if val != nil { t.Errorf("expected nil, got %s", val) } foundNameField := false doc.VisitFields(func(field index.Field) { if field.Name() == "name" && string(field.Value()) == "blahblah" { foundNameField = true } }) if !foundNameField { t.Errorf("expected to find field named 'name' with value 'blahblah'") } fields, err := idx.Fields() if err != nil { t.Fatal(err) } expectedFields := map[string]bool{ "_all": false, "name": false, "desc": false, "country": false, } if len(fields) < len(expectedFields) { t.Fatalf("expected %d fields got %d", len(expectedFields), len(fields)) } for _, f := range fields { expectedFields[f] = true } for ef, efp := range expectedFields { if !efp { t.Errorf("field %s is missing", ef) } } } func TestBug1096(t *testing.T) { tmpIndexPath := createTmpIndexPath(t) defer cleanupTmpIndexPath(t, tmpIndexPath) // use default mapping mapping := NewIndexMapping() // create a scorch index with default SAFE batches var idx Index idx, err = NewUsing(tmpIndexPath, mapping, "scorch", "scorch", nil) if err != nil { log.Fatal(err) } defer func() { err := idx.Close() if err != nil { t.Fatal(err) } }() // create a single batch instance that we will reuse // this should be safe because we have single goroutine // and we always wait for batch execution to finish batch := idx.NewBatch() // number of batches to execute for i := 0; i < 10; i++ { // number of documents to put into the batch for j := 0; j < 91; j++ { // create a doc id 0-90 (important so that we get id's 9 and 90) // this could duplicate something already in the index // this too should be OK and update the item in the index id := fmt.Sprintf("%d", j) err = batch.Index(id, map[string]interface{}{ "name": id, "batch": fmt.Sprintf("%d", i), }) if err != nil { log.Fatal(err) } } // execute the batch err = idx.Batch(batch) if err != nil { log.Fatal(err) } // reset the batch before reusing it batch.Reset() } // search for docs having name starting with the number 9 q := NewWildcardQuery("9*") q.SetField("name") req := NewSearchRequestOptions(q, 1000, 0, false) req.Fields = []string{"*"} var res *SearchResult res, err = idx.Search(req) if err != nil { log.Fatal(err) } // we expect only 2 hits, for docs 9 and 90 if res.Total > 2 { t.Fatalf("expected only 2 hits '9' and '90', got %v", res) } } func TestDataRaceBug1092(t *testing.T) { tmpIndexPath := createTmpIndexPath(t) defer cleanupTmpIndexPath(t, tmpIndexPath) // use default mapping mapping := NewIndexMapping() var idx Index idx, err = NewUsing(tmpIndexPath, mapping, upsidedown.Name, boltdb.Name, nil) if err != nil { log.Fatal(err) } defer func() { cerr := idx.Close() if cerr != nil { t.Fatal(cerr) } }() batch := idx.NewBatch() for i := 0; i < 10; i++ { err = idx.Batch(batch) if err != nil { t.Error(err) } batch.Reset() } } func TestBatchRaceBug1149(t *testing.T) { tmpIndexPath := createTmpIndexPath(t) defer cleanupTmpIndexPath(t, tmpIndexPath) i, err := New(tmpIndexPath, NewIndexMapping()) if err != nil { t.Fatal(err) } defer func() { err := i.Close() if err != nil { t.Fatal(err) } }() testBatchRaceBug1149(t, i) } func TestBatchRaceBug1149Scorch(t *testing.T) { tmpIndexPath := createTmpIndexPath(t) defer cleanupTmpIndexPath(t, tmpIndexPath) i, err := NewUsing(tmpIndexPath, NewIndexMapping(), "scorch", "scorch", nil) if err != nil { t.Fatal(err) } defer func() { err := i.Close() if err != nil { t.Fatal(err) } }() testBatchRaceBug1149(t, i) } func testBatchRaceBug1149(t *testing.T, i Index) { b := i.NewBatch() b.Delete("1") err = i.Batch(b) if err != nil { t.Fatal(err) } b.Reset() err = i.Batch(b) if err != nil { t.Fatal(err) } b.Reset() } func TestOptimisedConjunctionSearchHits(t *testing.T) { scorch.OptimizeDisjunctionUnadorned = false defer func() { scorch.OptimizeDisjunctionUnadorned = true }() defer func() { err := os.RemoveAll("testidx") if err != nil { t.Fatal(err) } }() idx, err := NewUsing("testidx", NewIndexMapping(), "scorch", "scorch", nil) if err != nil { t.Fatal(err) } doca := map[string]interface{}{ "country": "united", "name": "Mercure Hotel", "directions": "B560 and B56 Follow signs to the M56", } docb := map[string]interface{}{ "country": "united", "name": "Mercure Altrincham Bowdon Hotel", "directions": "A570 and A57 Follow signs to the M56 Manchester Airport", } docc := map[string]interface{}{ "country": "india united", "name": "Sonoma Hotel", "directions": "Northwest", } docd := map[string]interface{}{ "country": "United Kingdom", "name": "Cresta Court Hotel", "directions": "junction of A560 and A56", } b := idx.NewBatch() err = b.Index("a", doca) if err != nil { t.Error(err) } err = b.Index("b", docb) if err != nil { t.Error(err) } err = b.Index("c", docc) if err != nil { t.Error(err) } err = b.Index("d", docd) if err != nil { t.Error(err) } // execute the batch err = idx.Batch(b) if err != nil { log.Fatal(err) } mq := NewMatchQuery("united") mq.SetField("country") cq := NewConjunctionQuery(mq) mq1 := NewMatchQuery("hotel") mq1.SetField("name") cq.AddQuery(mq1) mq2 := NewMatchQuery("56") mq2.SetField("directions") mq2.SetFuzziness(1) cq.AddQuery(mq2) req := NewSearchRequest(cq) req.Score = "none" res, err := idx.Search(req) if err != nil { t.Fatal(err) } hitsWithOutScore := res.Total req = NewSearchRequest(cq) req.Score = "" res, err = idx.Search(req) if err != nil { t.Fatal(err) } hitsWithScore := res.Total if hitsWithOutScore != hitsWithScore { t.Errorf("expected %d hits without score, got %d", hitsWithScore, hitsWithOutScore) } err = idx.Close() if err != nil { t.Fatal(err) } } func TestIndexMappingDocValuesDynamic(t *testing.T) { im := NewIndexMapping() // DocValuesDynamic's default is true // Now explicitly set it to false im.DocValuesDynamic = false // Next, retrieve the JSON dump of the index mapping var data []byte data, err = json.Marshal(im) if err != nil { t.Fatal(err) } // Now, edit an unrelated setting in the index mapping var m map[string]interface{} err = json.Unmarshal(data, &m) if err != nil { t.Fatal(err) } m["index_dynamic"] = false data, err = json.Marshal(m) if err != nil { t.Fatal(err) } // Unmarshal back the changes into the index mapping struct if err = im.UnmarshalJSON(data); err != nil { t.Fatal(err) } // Expect DocValuesDynamic to remain false! if im.DocValuesDynamic { t.Fatalf("Expected DocValuesDynamic to remain false after the index mapping edit") } } func TestCopyIndex(t *testing.T) { tmpIndexPath := createTmpIndexPath(t) defer cleanupTmpIndexPath(t, tmpIndexPath) idx, err := New(tmpIndexPath, NewIndexMapping()) if err != nil { t.Fatal(err) } defer func() { err := idx.Close() if err != nil { t.Fatal(err) } }() doca := map[string]interface{}{ "name": "tester", "desc": "gophercon india testing", } err = idx.Index("a", doca) if err != nil { t.Error(err) } docy := map[string]interface{}{ "name": "jasper", "desc": "clojure", } err = idx.Index("y", docy) if err != nil { t.Error(err) } err = idx.Delete("y") if err != nil { t.Error(err) } docx := map[string]interface{}{ "name": "rose", "desc": "xoogler", } err = idx.Index("x", docx) if err != nil { t.Error(err) } err = idx.SetInternal([]byte("status"), []byte("pending")) if err != nil { t.Error(err) } docb := map[string]interface{}{ "name": "sree", "desc": "cbft janitor", } batch := idx.NewBatch() err = batch.Index("b", docb) if err != nil { t.Error(err) } batch.Delete("x") batch.SetInternal([]byte("batchi"), []byte("batchv")) batch.DeleteInternal([]byte("status")) err = idx.Batch(batch) if err != nil { t.Error(err) } val, err := idx.GetInternal([]byte("batchi")) if err != nil { t.Error(err) } if string(val) != "batchv" { t.Errorf("expected 'batchv', got '%s'", val) } val, err = idx.GetInternal([]byte("status")) if err != nil { t.Error(err) } if val != nil { t.Errorf("expected nil, got '%s'", val) } err = idx.SetInternal([]byte("seqno"), []byte("7")) if err != nil { t.Error(err) } err = idx.SetInternal([]byte("status"), []byte("ready")) if err != nil { t.Error(err) } err = idx.DeleteInternal([]byte("status")) if err != nil { t.Error(err) } val, err = idx.GetInternal([]byte("status")) if err != nil { t.Error(err) } if val != nil { t.Errorf("expected nil, got '%s'", val) } val, err = idx.GetInternal([]byte("seqno")) if err != nil { t.Error(err) } if string(val) != "7" { t.Errorf("expected '7', got '%s'", val) } count, err := idx.DocCount() if err != nil { t.Fatal(err) } if count != 2 { t.Errorf("expected doc count 2, got %d", count) } doc, err := idx.Document("a") if err != nil { t.Fatal(err) } foundNameField := false doc.VisitFields(func(field index.Field) { if field.Name() == "name" && string(field.Value()) == "tester" { foundNameField = true } }) if !foundNameField { t.Errorf("expected to find field named 'name' with value 'tester'") } fields, err := idx.Fields() if err != nil { t.Fatal(err) } expectedFields := map[string]bool{ "_all": false, "name": false, "desc": false, } if len(fields) < len(expectedFields) { t.Fatalf("expected %d fields got %d", len(expectedFields), len(fields)) } for _, f := range fields { expectedFields[f] = true } for ef, efp := range expectedFields { if !efp { t.Errorf("field %s is missing", ef) } } // now create a copy of the index, and repeat assertions on it copyableIndex, ok := idx.(IndexCopyable) if !ok { t.Fatal("index doesn't support copy") } backupIndexPath := createTmpIndexPath(t) defer cleanupTmpIndexPath(t, backupIndexPath) err = copyableIndex.CopyTo(FileSystemDirectory(backupIndexPath)) if err != nil { t.Fatalf("error copying the index: %v", err) } // open the copied index idxCopied, err := Open(backupIndexPath) if err != nil { t.Fatalf("unable to open copy index") } defer func() { err := idxCopied.Close() if err != nil { t.Fatalf("error closing copy index: %v", err) } }() // assertions on copied index copyCount, err := idxCopied.DocCount() if err != nil { t.Fatal(err) } if copyCount != 2 { t.Errorf("expected doc count 2, got %d", copyCount) } copyDoc, err := idxCopied.Document("a") if err != nil { t.Fatal(err) } copyFoundNameField := false copyDoc.VisitFields(func(field index.Field) { if field.Name() == "name" && string(field.Value()) == "tester" { copyFoundNameField = true } }) if !copyFoundNameField { t.Errorf("expected copy index to find field named 'name' with value 'tester'") } copyFields, err := idx.Fields() if err != nil { t.Fatal(err) } copyExpectedFields := map[string]bool{ "_all": false, "name": false, "desc": false, } if len(copyFields) < len(copyExpectedFields) { t.Fatalf("expected %d fields got %d", len(copyExpectedFields), len(copyFields)) } for _, f := range copyFields { copyExpectedFields[f] = true } for ef, efp := range copyExpectedFields { if !efp { t.Errorf("copy field %s is missing", ef) } } } func TestFuzzyScoring(t *testing.T) { tmpIndexPath := createTmpIndexPath(t) defer cleanupTmpIndexPath(t, tmpIndexPath) mp := NewIndexMapping() mp.DefaultAnalyzer = "simple" idx, err := New(tmpIndexPath, mp) if err != nil { t.Fatal(err) } batch := idx.NewBatch() docs := []map[string]interface{}{ { "textField": "ab", }, { "textField": "abc", }, { "textField": "abcd", }, } for _, doc := range docs { err := batch.Index(fmt.Sprintf("%v", doc["textField"]), doc) if err != nil { t.Fatal(err) } } err = idx.Batch(batch) if err != nil { t.Fatal(err) } query := NewFuzzyQuery("ab") query.Fuzziness = 2 searchRequest := NewSearchRequestOptions(query, 10, 0, true) res, err := idx.Search(searchRequest) if err != nil { t.Error(err) } maxScore := res.Hits[0].Score for i, hit := range res.Hits { if maxScore/float64(i+1) != hit.Score { t.Errorf("expected score - %f, got score - %f", maxScore/float64(i+1), hit.Score) } } err = idx.Close() if err != nil { t.Fatal(err) } }