You can not select more than 25 topics
			Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
		
		
		
		
		
			
		
			
				
					
					
						
							145 lines
						
					
					
						
							3.8 KiB
						
					
					
				
			
		
		
	
	
							145 lines
						
					
					
						
							3.8 KiB
						
					
					
				| //  Copyright (c) 2014 Couchbase, Inc.
 | |
| //
 | |
| // Licensed under the Apache License, Version 2.0 (the "License");
 | |
| // you may not use this file except in compliance with the License.
 | |
| // You may obtain a copy of the License at
 | |
| //
 | |
| // 		http://www.apache.org/licenses/LICENSE-2.0
 | |
| //
 | |
| // Unless required by applicable law or agreed to in writing, software
 | |
| // distributed under the License is distributed on an "AS IS" BASIS,
 | |
| // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 | |
| // See the License for the specific language governing permissions and
 | |
| // limitations under the License.
 | |
| 
 | |
| package document
 | |
| 
 | |
| import (
 | |
| 	"fmt"
 | |
| 	"reflect"
 | |
| 
 | |
| 	"github.com/blevesearch/bleve/analysis"
 | |
| 	"github.com/blevesearch/bleve/numeric"
 | |
| 	"github.com/blevesearch/bleve/size"
 | |
| )
 | |
| 
 | |
| var reflectStaticSizeNumericField int
 | |
| 
 | |
| func init() {
 | |
| 	var f NumericField
 | |
| 	reflectStaticSizeNumericField = int(reflect.TypeOf(f).Size())
 | |
| }
 | |
| 
 | |
| const DefaultNumericIndexingOptions = StoreField | IndexField | DocValues
 | |
| 
 | |
| const DefaultPrecisionStep uint = 4
 | |
| 
 | |
| type NumericField struct {
 | |
| 	name              string
 | |
| 	arrayPositions    []uint64
 | |
| 	options           IndexingOptions
 | |
| 	value             numeric.PrefixCoded
 | |
| 	numPlainTextBytes uint64
 | |
| }
 | |
| 
 | |
| func (n *NumericField) Size() int {
 | |
| 	return reflectStaticSizeNumericField + size.SizeOfPtr +
 | |
| 		len(n.name) +
 | |
| 		len(n.arrayPositions)*size.SizeOfPtr
 | |
| }
 | |
| 
 | |
| func (n *NumericField) Name() string {
 | |
| 	return n.name
 | |
| }
 | |
| 
 | |
| func (n *NumericField) ArrayPositions() []uint64 {
 | |
| 	return n.arrayPositions
 | |
| }
 | |
| 
 | |
| func (n *NumericField) Options() IndexingOptions {
 | |
| 	return n.options
 | |
| }
 | |
| 
 | |
| func (n *NumericField) Analyze() (int, analysis.TokenFrequencies) {
 | |
| 	tokens := make(analysis.TokenStream, 0)
 | |
| 	tokens = append(tokens, &analysis.Token{
 | |
| 		Start:    0,
 | |
| 		End:      len(n.value),
 | |
| 		Term:     n.value,
 | |
| 		Position: 1,
 | |
| 		Type:     analysis.Numeric,
 | |
| 	})
 | |
| 
 | |
| 	original, err := n.value.Int64()
 | |
| 	if err == nil {
 | |
| 
 | |
| 		shift := DefaultPrecisionStep
 | |
| 		for shift < 64 {
 | |
| 			shiftEncoded, err := numeric.NewPrefixCodedInt64(original, shift)
 | |
| 			if err != nil {
 | |
| 				break
 | |
| 			}
 | |
| 			token := analysis.Token{
 | |
| 				Start:    0,
 | |
| 				End:      len(shiftEncoded),
 | |
| 				Term:     shiftEncoded,
 | |
| 				Position: 1,
 | |
| 				Type:     analysis.Numeric,
 | |
| 			}
 | |
| 			tokens = append(tokens, &token)
 | |
| 			shift += DefaultPrecisionStep
 | |
| 		}
 | |
| 	}
 | |
| 
 | |
| 	fieldLength := len(tokens)
 | |
| 	tokenFreqs := analysis.TokenFrequency(tokens, n.arrayPositions, n.options.IncludeTermVectors())
 | |
| 	return fieldLength, tokenFreqs
 | |
| }
 | |
| 
 | |
| func (n *NumericField) Value() []byte {
 | |
| 	return n.value
 | |
| }
 | |
| 
 | |
| func (n *NumericField) Number() (float64, error) {
 | |
| 	i64, err := n.value.Int64()
 | |
| 	if err != nil {
 | |
| 		return 0.0, err
 | |
| 	}
 | |
| 	return numeric.Int64ToFloat64(i64), nil
 | |
| }
 | |
| 
 | |
| func (n *NumericField) GoString() string {
 | |
| 	return fmt.Sprintf("&document.NumericField{Name:%s, Options: %s, Value: %s}", n.name, n.options, n.value)
 | |
| }
 | |
| 
 | |
| func (n *NumericField) NumPlainTextBytes() uint64 {
 | |
| 	return n.numPlainTextBytes
 | |
| }
 | |
| 
 | |
| func NewNumericFieldFromBytes(name string, arrayPositions []uint64, value []byte) *NumericField {
 | |
| 	return &NumericField{
 | |
| 		name:              name,
 | |
| 		arrayPositions:    arrayPositions,
 | |
| 		value:             value,
 | |
| 		options:           DefaultNumericIndexingOptions,
 | |
| 		numPlainTextBytes: uint64(len(value)),
 | |
| 	}
 | |
| }
 | |
| 
 | |
| func NewNumericField(name string, arrayPositions []uint64, number float64) *NumericField {
 | |
| 	return NewNumericFieldWithIndexingOptions(name, arrayPositions, number, DefaultNumericIndexingOptions)
 | |
| }
 | |
| 
 | |
| func NewNumericFieldWithIndexingOptions(name string, arrayPositions []uint64, number float64, options IndexingOptions) *NumericField {
 | |
| 	numberInt64 := numeric.Float64ToInt64(number)
 | |
| 	prefixCoded := numeric.MustNewPrefixCodedInt64(numberInt64, 0)
 | |
| 	return &NumericField{
 | |
| 		name:           name,
 | |
| 		arrayPositions: arrayPositions,
 | |
| 		value:          prefixCoded,
 | |
| 		options:        options,
 | |
| 		// not correct, just a place holder until we revisit how fields are
 | |
| 		// represented and can fix this better
 | |
| 		numPlainTextBytes: uint64(8),
 | |
| 	}
 | |
| }
 | |
| 
 |