2017-09-17 04:16:21 +08:00
|
|
|
// Copyright (c) 2017 Couchbase, Inc.
|
|
|
|
//
|
|
|
|
// Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
// you may not use this file except in compliance with the License.
|
|
|
|
// You may obtain a copy of the License at
|
|
|
|
//
|
|
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
//
|
|
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
|
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
// See the License for the specific language governing permissions and
|
|
|
|
// limitations under the License.
|
|
|
|
|
|
|
|
package searcher
|
|
|
|
|
|
|
|
import (
|
|
|
|
"github.com/blevesearch/bleve/document"
|
|
|
|
"github.com/blevesearch/bleve/geo"
|
|
|
|
"github.com/blevesearch/bleve/index"
|
|
|
|
"github.com/blevesearch/bleve/numeric"
|
|
|
|
"github.com/blevesearch/bleve/search"
|
|
|
|
)
|
|
|
|
|
2019-11-27 17:23:33 +08:00
|
|
|
// filterFunc reports whether the given key is accepted. In this file it is
// the type of the "is this term indexed" predicate built by
// buildIsIndexedFunc.
type filterFunc func(key []byte) bool
|
|
|
|
|
2020-09-07 06:51:14 +08:00
|
|
|
var GeoBitsShift1 = geo.GeoBits << 1
|
2019-11-27 17:23:33 +08:00
|
|
|
var GeoBitsShift1Minus1 = GeoBitsShift1 - 1
|
|
|
|
|
2017-09-17 04:16:21 +08:00
|
|
|
func NewGeoBoundingBoxSearcher(indexReader index.IndexReader, minLon, minLat,
|
|
|
|
maxLon, maxLat float64, field string, boost float64,
|
|
|
|
options search.SearcherOptions, checkBoundaries bool) (
|
|
|
|
search.Searcher, error) {
|
|
|
|
|
|
|
|
// track list of opened searchers, for cleanup on early exit
|
|
|
|
var openedSearchers []search.Searcher
|
|
|
|
cleanupOpenedSearchers := func() {
|
|
|
|
for _, s := range openedSearchers {
|
|
|
|
_ = s.Close()
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// do math to produce list of terms needed for this search
|
2019-11-27 17:23:33 +08:00
|
|
|
onBoundaryTerms, notOnBoundaryTerms, err := ComputeGeoRange(0, GeoBitsShift1Minus1,
|
|
|
|
minLon, minLat, maxLon, maxLat, checkBoundaries, indexReader, field)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
2017-09-17 04:16:21 +08:00
|
|
|
|
|
|
|
var onBoundarySearcher search.Searcher
|
2019-02-18 08:50:26 +08:00
|
|
|
dvReader, err := indexReader.DocValueReader([]string{field})
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
2017-09-17 04:16:21 +08:00
|
|
|
if len(onBoundaryTerms) > 0 {
|
|
|
|
rawOnBoundarySearcher, err := NewMultiTermSearcherBytes(indexReader,
|
|
|
|
onBoundaryTerms, field, boost, options, false)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
// add filter to check points near the boundary
|
|
|
|
onBoundarySearcher = NewFilteringSearcher(rawOnBoundarySearcher,
|
2019-02-18 08:50:26 +08:00
|
|
|
buildRectFilter(dvReader, field, minLon, minLat, maxLon, maxLat))
|
2017-09-17 04:16:21 +08:00
|
|
|
openedSearchers = append(openedSearchers, onBoundarySearcher)
|
|
|
|
}
|
|
|
|
|
|
|
|
var notOnBoundarySearcher search.Searcher
|
|
|
|
if len(notOnBoundaryTerms) > 0 {
|
|
|
|
var err error
|
|
|
|
notOnBoundarySearcher, err = NewMultiTermSearcherBytes(indexReader,
|
|
|
|
notOnBoundaryTerms, field, boost, options, false)
|
|
|
|
if err != nil {
|
|
|
|
cleanupOpenedSearchers()
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
openedSearchers = append(openedSearchers, notOnBoundarySearcher)
|
|
|
|
}
|
|
|
|
|
|
|
|
if onBoundarySearcher != nil && notOnBoundarySearcher != nil {
|
|
|
|
rv, err := NewDisjunctionSearcher(indexReader,
|
|
|
|
[]search.Searcher{
|
|
|
|
onBoundarySearcher,
|
|
|
|
notOnBoundarySearcher,
|
|
|
|
},
|
|
|
|
0, options)
|
|
|
|
if err != nil {
|
|
|
|
cleanupOpenedSearchers()
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
return rv, nil
|
|
|
|
} else if onBoundarySearcher != nil {
|
|
|
|
return onBoundarySearcher, nil
|
|
|
|
} else if notOnBoundarySearcher != nil {
|
|
|
|
return notOnBoundarySearcher, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
return NewMatchNoneSearcher(indexReader)
|
|
|
|
}
|
|
|
|
|
|
|
|
var geoMaxShift = document.GeoPrecisionStep * 4
|
|
|
|
var geoDetailLevel = ((geo.GeoBits << 1) - geoMaxShift) / 2
|
2020-09-07 06:51:14 +08:00
|
|
|
// closeFunc releases a resource and reports any failure in doing so. In this
// file it is the type of the cleanup callback returned by buildIsIndexedFunc.
type closeFunc func() error
|
2017-09-17 04:16:21 +08:00
|
|
|
|
|
|
|
func ComputeGeoRange(term uint64, shift uint,
|
2019-11-27 17:23:33 +08:00
|
|
|
sminLon, sminLat, smaxLon, smaxLat float64, checkBoundaries bool,
|
|
|
|
indexReader index.IndexReader, field string) (
|
|
|
|
onBoundary [][]byte, notOnBoundary [][]byte, err error) {
|
|
|
|
|
2020-09-07 06:51:14 +08:00
|
|
|
isIndexed, closeF, err := buildIsIndexedFunc(indexReader, field)
|
|
|
|
if closeF != nil {
|
|
|
|
defer func() {
|
|
|
|
cerr := closeF()
|
|
|
|
if cerr != nil {
|
|
|
|
err = cerr
|
|
|
|
}
|
|
|
|
}()
|
|
|
|
}
|
2019-11-27 17:23:33 +08:00
|
|
|
|
2020-09-07 06:51:14 +08:00
|
|
|
grc := &geoRangeCompute{
|
|
|
|
preallocBytesLen: 32,
|
|
|
|
preallocBytes: make([]byte, 32),
|
|
|
|
sminLon: sminLon,
|
|
|
|
sminLat: sminLat,
|
|
|
|
smaxLon: smaxLon,
|
|
|
|
smaxLat: smaxLat,
|
|
|
|
checkBoundaries: checkBoundaries,
|
|
|
|
isIndexed: isIndexed,
|
2019-11-27 17:23:33 +08:00
|
|
|
}
|
|
|
|
|
2020-09-07 06:51:14 +08:00
|
|
|
grc.computeGeoRange(term, shift)
|
|
|
|
|
|
|
|
return grc.onBoundary, grc.notOnBoundary, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func buildIsIndexedFunc(indexReader index.IndexReader, field string) (isIndexed filterFunc, closeF closeFunc, err error) {
|
2019-11-27 17:23:33 +08:00
|
|
|
if irr, ok := indexReader.(index.IndexReaderContains); ok {
|
2020-09-07 06:51:14 +08:00
|
|
|
fieldDict, err := irr.FieldDictContains(field)
|
2019-11-27 17:23:33 +08:00
|
|
|
if err != nil {
|
|
|
|
return nil, nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
isIndexed = func(term []byte) bool {
|
|
|
|
found, err := fieldDict.Contains(term)
|
|
|
|
return err == nil && found
|
|
|
|
}
|
2017-09-17 04:16:21 +08:00
|
|
|
|
2020-09-07 06:51:14 +08:00
|
|
|
closeF = func() error {
|
2019-11-27 17:23:33 +08:00
|
|
|
if fd, ok := fieldDict.(index.FieldDict); ok {
|
2020-09-07 06:51:14 +08:00
|
|
|
err := fd.Close()
|
|
|
|
if err != nil {
|
|
|
|
return err
|
2019-11-27 17:23:33 +08:00
|
|
|
}
|
|
|
|
}
|
2020-09-07 06:51:14 +08:00
|
|
|
return nil
|
2017-09-17 04:16:21 +08:00
|
|
|
}
|
2020-09-07 06:51:14 +08:00
|
|
|
} else if indexReader != nil {
|
2019-11-27 17:23:33 +08:00
|
|
|
isIndexed = func(term []byte) bool {
|
|
|
|
reader, err := indexReader.TermFieldReader(term, field, false, false, false)
|
|
|
|
if err != nil || reader == nil {
|
|
|
|
return false
|
|
|
|
}
|
|
|
|
if reader.Count() == 0 {
|
|
|
|
_ = reader.Close()
|
|
|
|
return false
|
|
|
|
}
|
|
|
|
_ = reader.Close()
|
2020-09-07 06:51:14 +08:00
|
|
|
return true
|
2019-11-27 17:23:33 +08:00
|
|
|
}
|
|
|
|
|
2020-09-07 06:51:14 +08:00
|
|
|
} else {
|
|
|
|
isIndexed = func([]byte) bool {
|
|
|
|
return true
|
2019-11-27 17:23:33 +08:00
|
|
|
}
|
|
|
|
}
|
2020-09-07 06:51:14 +08:00
|
|
|
return isIndexed, closeF, err
|
2017-09-17 04:16:21 +08:00
|
|
|
}
|
|
|
|
|
2019-02-18 08:50:26 +08:00
|
|
|
func buildRectFilter(dvReader index.DocValueReader, field string,
|
2017-09-17 04:16:21 +08:00
|
|
|
minLon, minLat, maxLon, maxLat float64) FilterFunc {
|
|
|
|
return func(d *search.DocumentMatch) bool {
|
2020-05-10 13:40:54 +08:00
|
|
|
// check geo matches against all numeric type terms indexed
|
|
|
|
var lons, lats []float64
|
2017-09-17 04:16:21 +08:00
|
|
|
var found bool
|
2019-02-18 08:50:26 +08:00
|
|
|
err := dvReader.VisitDocValues(d.IndexInternalID, func(field string, term []byte) {
|
|
|
|
// only consider the values which are shifted 0
|
|
|
|
prefixCoded := numeric.PrefixCoded(term)
|
|
|
|
shift, err := prefixCoded.Shift()
|
|
|
|
if err == nil && shift == 0 {
|
|
|
|
var i64 int64
|
|
|
|
i64, err = prefixCoded.Int64()
|
|
|
|
if err == nil {
|
2020-05-10 13:40:54 +08:00
|
|
|
lons = append(lons, geo.MortonUnhashLon(uint64(i64)))
|
|
|
|
lats = append(lats, geo.MortonUnhashLat(uint64(i64)))
|
2019-02-18 08:50:26 +08:00
|
|
|
found = true
|
2017-09-17 04:16:21 +08:00
|
|
|
}
|
2019-02-18 08:50:26 +08:00
|
|
|
}
|
|
|
|
})
|
2017-09-17 04:16:21 +08:00
|
|
|
if err == nil && found {
|
2020-05-10 13:40:54 +08:00
|
|
|
for i := range lons {
|
|
|
|
if geo.BoundingBoxContains(lons[i], lats[i],
|
|
|
|
minLon, minLat, maxLon, maxLat) {
|
|
|
|
return true
|
|
|
|
}
|
|
|
|
}
|
2017-09-17 04:16:21 +08:00
|
|
|
}
|
|
|
|
return false
|
|
|
|
}
|
|
|
|
}
|
2020-09-07 06:51:14 +08:00
|
|
|
|
|
|
|
// geoRangeCompute carries the state of one ComputeGeoRange traversal: the
// search rectangle, the term-selection options, a scratch buffer for encoding
// terms, and the terms collected so far.
type geoRangeCompute struct {
	// preallocBytesLen is the size of the most recently allocated scratch
	// buffer; it is doubled each time a new buffer is allocated.
	preallocBytesLen int
	// preallocBytes is the unused remainder of the scratch buffer that
	// makePrefixCoded hands to the prefix-coding routine.
	preallocBytes []byte

	// search rectangle
	sminLon float64
	sminLat float64
	smaxLon float64
	smaxLat float64

	// checkBoundaries selects whether cells that only intersect the
	// rectangle are collected in onBoundary rather than notOnBoundary.
	checkBoundaries bool

	// collected terms
	onBoundary    [][]byte
	notOnBoundary [][]byte

	// isIndexed reports whether a candidate term should be kept.
	isIndexed func(term []byte) bool
}
|
|
|
|
|
|
|
|
func (grc *geoRangeCompute) makePrefixCoded(in int64, shift uint) (rv numeric.PrefixCoded) {
|
|
|
|
if len(grc.preallocBytes) <= 0 {
|
|
|
|
grc.preallocBytesLen = grc.preallocBytesLen * 2
|
|
|
|
grc.preallocBytes = make([]byte, grc.preallocBytesLen)
|
|
|
|
}
|
|
|
|
|
|
|
|
rv, grc.preallocBytes, _ =
|
|
|
|
numeric.NewPrefixCodedInt64Prealloc(in, shift, grc.preallocBytes)
|
|
|
|
|
|
|
|
return rv
|
|
|
|
}
|
|
|
|
|
|
|
|
func (grc *geoRangeCompute) computeGeoRange(term uint64, shift uint) {
|
|
|
|
split := term | uint64(0x1)<<shift
|
|
|
|
var upperMax uint64
|
|
|
|
if shift < 63 {
|
|
|
|
upperMax = term | ((uint64(1) << (shift + 1)) - 1)
|
|
|
|
} else {
|
|
|
|
upperMax = 0xffffffffffffffff
|
|
|
|
}
|
|
|
|
lowerMax := split - 1
|
|
|
|
grc.relateAndRecurse(term, lowerMax, shift)
|
|
|
|
grc.relateAndRecurse(split, upperMax, shift)
|
|
|
|
}
|
|
|
|
|
|
|
|
func (grc *geoRangeCompute) relateAndRecurse(start, end uint64, res uint) {
|
|
|
|
minLon := geo.MortonUnhashLon(start)
|
|
|
|
minLat := geo.MortonUnhashLat(start)
|
|
|
|
maxLon := geo.MortonUnhashLon(end)
|
|
|
|
maxLat := geo.MortonUnhashLat(end)
|
|
|
|
|
|
|
|
level := (GeoBitsShift1 - res) >> 1
|
|
|
|
|
|
|
|
within := res%document.GeoPrecisionStep == 0 &&
|
|
|
|
geo.RectWithin(minLon, minLat, maxLon, maxLat,
|
|
|
|
grc.sminLon, grc.sminLat, grc.smaxLon, grc.smaxLat)
|
|
|
|
if within || (level == geoDetailLevel &&
|
|
|
|
geo.RectIntersects(minLon, minLat, maxLon, maxLat,
|
|
|
|
grc.sminLon, grc.sminLat, grc.smaxLon, grc.smaxLat)) {
|
|
|
|
codedTerm := grc.makePrefixCoded(int64(start), res)
|
|
|
|
if grc.isIndexed(codedTerm) {
|
|
|
|
if !within && grc.checkBoundaries {
|
|
|
|
grc.onBoundary = append(grc.onBoundary, codedTerm)
|
|
|
|
} else {
|
|
|
|
grc.notOnBoundary = append(grc.notOnBoundary, codedTerm)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
} else if level < geoDetailLevel &&
|
|
|
|
geo.RectIntersects(minLon, minLat, maxLon, maxLat,
|
|
|
|
grc.sminLon, grc.sminLat, grc.smaxLon, grc.smaxLat) {
|
|
|
|
grc.computeGeoRange(start, res-1)
|
|
|
|
}
|
|
|
|
}
|