2017-01-25 10:43:02 +08:00
|
|
|
// Copyright (c) 2014 Couchbase, Inc.
|
|
|
|
//
|
|
|
|
// Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
// you may not use this file except in compliance with the License.
|
|
|
|
// You may obtain a copy of the License at
|
|
|
|
//
|
|
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
//
|
|
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
|
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
// See the License for the specific language governing permissions and
|
|
|
|
// limitations under the License.
|
|
|
|
|
|
|
|
package document
|
|
|
|
|
|
|
|
import (
|
|
|
|
"fmt"
|
2019-02-18 08:50:26 +08:00
|
|
|
"reflect"
|
2017-01-25 10:43:02 +08:00
|
|
|
|
2021-01-18 09:21:14 +08:00
|
|
|
"github.com/blevesearch/bleve/v2/analysis"
|
|
|
|
"github.com/blevesearch/bleve/v2/numeric"
|
|
|
|
"github.com/blevesearch/bleve/v2/size"
|
|
|
|
index "github.com/blevesearch/bleve_index_api"
|
2017-01-25 10:43:02 +08:00
|
|
|
)
|
|
|
|
|
2019-02-18 08:50:26 +08:00
|
|
|
var reflectStaticSizeNumericField int
|
|
|
|
|
|
|
|
func init() {
|
|
|
|
var f NumericField
|
|
|
|
reflectStaticSizeNumericField = int(reflect.TypeOf(f).Size())
|
|
|
|
}
|
|
|
|
|
2021-01-18 09:21:14 +08:00
|
|
|
const DefaultNumericIndexingOptions = index.StoreField | index.IndexField | index.DocValues
|
2017-01-25 10:43:02 +08:00
|
|
|
|
|
|
|
const DefaultPrecisionStep uint = 4
|
|
|
|
|
|
|
|
type NumericField struct {
|
|
|
|
name string
|
|
|
|
arrayPositions []uint64
|
2021-01-18 09:21:14 +08:00
|
|
|
options index.FieldIndexingOptions
|
2017-01-25 10:43:02 +08:00
|
|
|
value numeric.PrefixCoded
|
|
|
|
numPlainTextBytes uint64
|
2021-01-18 09:21:14 +08:00
|
|
|
length int
|
|
|
|
frequencies index.TokenFrequencies
|
2017-01-25 10:43:02 +08:00
|
|
|
}
|
|
|
|
|
2019-02-18 08:50:26 +08:00
|
|
|
func (n *NumericField) Size() int {
|
|
|
|
return reflectStaticSizeNumericField + size.SizeOfPtr +
|
|
|
|
len(n.name) +
|
|
|
|
len(n.arrayPositions)*size.SizeOfPtr
|
|
|
|
}
|
|
|
|
|
2017-01-25 10:43:02 +08:00
|
|
|
func (n *NumericField) Name() string {
|
|
|
|
return n.name
|
|
|
|
}
|
|
|
|
|
|
|
|
func (n *NumericField) ArrayPositions() []uint64 {
|
|
|
|
return n.arrayPositions
|
|
|
|
}
|
|
|
|
|
2021-01-18 09:21:14 +08:00
|
|
|
func (n *NumericField) Options() index.FieldIndexingOptions {
|
2017-01-25 10:43:02 +08:00
|
|
|
return n.options
|
|
|
|
}
|
|
|
|
|
2021-01-18 09:21:14 +08:00
|
|
|
func (n *NumericField) EncodedFieldType() byte {
|
|
|
|
return 'n'
|
|
|
|
}
|
|
|
|
|
|
|
|
func (n *NumericField) AnalyzedLength() int {
|
|
|
|
return n.length
|
|
|
|
}
|
|
|
|
|
|
|
|
func (n *NumericField) AnalyzedTokenFrequencies() index.TokenFrequencies {
|
|
|
|
return n.frequencies
|
|
|
|
}
|
|
|
|
|
|
|
|
func (n *NumericField) Analyze() {
|
2017-01-25 10:43:02 +08:00
|
|
|
tokens := make(analysis.TokenStream, 0)
|
|
|
|
tokens = append(tokens, &analysis.Token{
|
|
|
|
Start: 0,
|
|
|
|
End: len(n.value),
|
|
|
|
Term: n.value,
|
|
|
|
Position: 1,
|
|
|
|
Type: analysis.Numeric,
|
|
|
|
})
|
|
|
|
|
|
|
|
original, err := n.value.Int64()
|
|
|
|
if err == nil {
|
|
|
|
|
|
|
|
shift := DefaultPrecisionStep
|
|
|
|
for shift < 64 {
|
|
|
|
shiftEncoded, err := numeric.NewPrefixCodedInt64(original, shift)
|
|
|
|
if err != nil {
|
|
|
|
break
|
|
|
|
}
|
|
|
|
token := analysis.Token{
|
|
|
|
Start: 0,
|
|
|
|
End: len(shiftEncoded),
|
|
|
|
Term: shiftEncoded,
|
|
|
|
Position: 1,
|
|
|
|
Type: analysis.Numeric,
|
|
|
|
}
|
|
|
|
tokens = append(tokens, &token)
|
|
|
|
shift += DefaultPrecisionStep
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2021-01-18 09:21:14 +08:00
|
|
|
n.length = len(tokens)
|
|
|
|
n.frequencies = analysis.TokenFrequency(tokens, n.arrayPositions, n.options)
|
2017-01-25 10:43:02 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
func (n *NumericField) Value() []byte {
|
|
|
|
return n.value
|
|
|
|
}
|
|
|
|
|
|
|
|
func (n *NumericField) Number() (float64, error) {
|
|
|
|
i64, err := n.value.Int64()
|
|
|
|
if err != nil {
|
|
|
|
return 0.0, err
|
|
|
|
}
|
|
|
|
return numeric.Int64ToFloat64(i64), nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func (n *NumericField) GoString() string {
|
|
|
|
return fmt.Sprintf("&document.NumericField{Name:%s, Options: %s, Value: %s}", n.name, n.options, n.value)
|
|
|
|
}
|
|
|
|
|
|
|
|
func (n *NumericField) NumPlainTextBytes() uint64 {
|
|
|
|
return n.numPlainTextBytes
|
|
|
|
}
|
|
|
|
|
|
|
|
func NewNumericFieldFromBytes(name string, arrayPositions []uint64, value []byte) *NumericField {
|
|
|
|
return &NumericField{
|
|
|
|
name: name,
|
|
|
|
arrayPositions: arrayPositions,
|
|
|
|
value: value,
|
|
|
|
options: DefaultNumericIndexingOptions,
|
|
|
|
numPlainTextBytes: uint64(len(value)),
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func NewNumericField(name string, arrayPositions []uint64, number float64) *NumericField {
|
|
|
|
return NewNumericFieldWithIndexingOptions(name, arrayPositions, number, DefaultNumericIndexingOptions)
|
|
|
|
}
|
|
|
|
|
2021-01-18 09:21:14 +08:00
|
|
|
func NewNumericFieldWithIndexingOptions(name string, arrayPositions []uint64, number float64, options index.FieldIndexingOptions) *NumericField {
|
2017-01-25 10:43:02 +08:00
|
|
|
numberInt64 := numeric.Float64ToInt64(number)
|
|
|
|
prefixCoded := numeric.MustNewPrefixCodedInt64(numberInt64, 0)
|
|
|
|
return &NumericField{
|
|
|
|
name: name,
|
|
|
|
arrayPositions: arrayPositions,
|
|
|
|
value: prefixCoded,
|
|
|
|
options: options,
|
|
|
|
// not correct, just a place holder until we revisit how fields are
|
|
|
|
// represented and can fix this better
|
|
|
|
numPlainTextBytes: uint64(8),
|
|
|
|
}
|
|
|
|
}
|