2017-01-25 02:43:02 +00:00
|
|
|
// Copyright (c) 2014 Couchbase, Inc.
|
|
|
|
//
|
|
|
|
// Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
// you may not use this file except in compliance with the License.
|
|
|
|
// You may obtain a copy of the License at
|
|
|
|
//
|
|
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
//
|
|
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
|
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
// See the License for the specific language governing permissions and
|
|
|
|
// limitations under the License.
|
|
|
|
|
|
|
|
package search
|
|
|
|
|
|
|
|
import (
|
2019-02-18 00:50:26 +00:00
|
|
|
"reflect"
|
2017-01-25 02:43:02 +00:00
|
|
|
"sort"
|
|
|
|
|
2021-01-18 01:21:14 +00:00
|
|
|
"github.com/blevesearch/bleve/v2/size"
|
|
|
|
index "github.com/blevesearch/bleve_index_api"
|
2017-01-25 02:43:02 +00:00
|
|
|
)
|
|
|
|
|
2019-02-18 00:50:26 +00:00
|
|
|
var reflectStaticSizeFacetsBuilder int
|
|
|
|
var reflectStaticSizeFacetResult int
|
|
|
|
var reflectStaticSizeTermFacet int
|
|
|
|
var reflectStaticSizeNumericRangeFacet int
|
|
|
|
var reflectStaticSizeDateRangeFacet int
|
|
|
|
|
|
|
|
func init() {
|
|
|
|
var fb FacetsBuilder
|
|
|
|
reflectStaticSizeFacetsBuilder = int(reflect.TypeOf(fb).Size())
|
|
|
|
var fr FacetResult
|
|
|
|
reflectStaticSizeFacetResult = int(reflect.TypeOf(fr).Size())
|
|
|
|
var tf TermFacet
|
|
|
|
reflectStaticSizeTermFacet = int(reflect.TypeOf(tf).Size())
|
|
|
|
var nrf NumericRangeFacet
|
|
|
|
reflectStaticSizeNumericRangeFacet = int(reflect.TypeOf(nrf).Size())
|
|
|
|
var drf DateRangeFacet
|
|
|
|
reflectStaticSizeDateRangeFacet = int(reflect.TypeOf(drf).Size())
|
|
|
|
}
|
|
|
|
|
2017-01-25 02:43:02 +00:00
|
|
|
type FacetBuilder interface {
|
2017-09-16 20:16:21 +00:00
|
|
|
StartDoc()
|
|
|
|
UpdateVisitor(field string, term []byte)
|
|
|
|
EndDoc()
|
|
|
|
|
2017-01-25 02:43:02 +00:00
|
|
|
Result() *FacetResult
|
|
|
|
Field() string
|
2019-02-18 00:50:26 +00:00
|
|
|
|
|
|
|
Size() int
|
2017-01-25 02:43:02 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
type FacetsBuilder struct {
|
|
|
|
indexReader index.IndexReader
|
2019-02-18 00:50:26 +00:00
|
|
|
facetNames []string
|
|
|
|
facets []FacetBuilder
|
2017-01-25 02:43:02 +00:00
|
|
|
fields []string
|
|
|
|
}
|
|
|
|
|
|
|
|
func NewFacetsBuilder(indexReader index.IndexReader) *FacetsBuilder {
|
|
|
|
return &FacetsBuilder{
|
|
|
|
indexReader: indexReader,
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2019-02-18 00:50:26 +00:00
|
|
|
func (fb *FacetsBuilder) Size() int {
|
|
|
|
sizeInBytes := reflectStaticSizeFacetsBuilder + size.SizeOfPtr
|
|
|
|
|
|
|
|
for k, v := range fb.facets {
|
|
|
|
sizeInBytes += size.SizeOfString + v.Size() + len(fb.facetNames[k])
|
|
|
|
}
|
|
|
|
|
|
|
|
for _, entry := range fb.fields {
|
|
|
|
sizeInBytes += size.SizeOfString + len(entry)
|
|
|
|
}
|
|
|
|
|
|
|
|
return sizeInBytes
|
|
|
|
}
|
|
|
|
|
2017-01-25 02:43:02 +00:00
|
|
|
func (fb *FacetsBuilder) Add(name string, facetBuilder FacetBuilder) {
|
2019-02-18 00:50:26 +00:00
|
|
|
fb.facetNames = append(fb.facetNames, name)
|
|
|
|
fb.facets = append(fb.facets, facetBuilder)
|
2017-09-16 20:16:21 +00:00
|
|
|
fb.fields = append(fb.fields, facetBuilder.Field())
|
2017-01-25 02:43:02 +00:00
|
|
|
}
|
|
|
|
|
2017-09-16 20:16:21 +00:00
|
|
|
func (fb *FacetsBuilder) RequiredFields() []string {
|
|
|
|
return fb.fields
|
|
|
|
}
|
|
|
|
|
|
|
|
func (fb *FacetsBuilder) StartDoc() {
|
|
|
|
for _, facetBuilder := range fb.facets {
|
|
|
|
facetBuilder.StartDoc()
|
2017-01-25 02:43:02 +00:00
|
|
|
}
|
2017-09-16 20:16:21 +00:00
|
|
|
}
|
2017-01-25 02:43:02 +00:00
|
|
|
|
2017-09-16 20:16:21 +00:00
|
|
|
func (fb *FacetsBuilder) EndDoc() {
|
|
|
|
for _, facetBuilder := range fb.facets {
|
|
|
|
facetBuilder.EndDoc()
|
2017-01-25 02:43:02 +00:00
|
|
|
}
|
2017-09-16 20:16:21 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
func (fb *FacetsBuilder) UpdateVisitor(field string, term []byte) {
|
2017-01-25 02:43:02 +00:00
|
|
|
for _, facetBuilder := range fb.facets {
|
2017-09-16 20:16:21 +00:00
|
|
|
facetBuilder.UpdateVisitor(field, term)
|
2017-01-25 02:43:02 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
type TermFacet struct {
|
|
|
|
Term string `json:"term"`
|
|
|
|
Count int `json:"count"`
|
|
|
|
}
|
|
|
|
|
|
|
|
type TermFacets []*TermFacet
|
|
|
|
|
|
|
|
func (tf TermFacets) Add(termFacet *TermFacet) TermFacets {
|
|
|
|
for _, existingTerm := range tf {
|
|
|
|
if termFacet.Term == existingTerm.Term {
|
|
|
|
existingTerm.Count += termFacet.Count
|
|
|
|
return tf
|
|
|
|
}
|
|
|
|
}
|
|
|
|
// if we got here it wasn't already in the existing terms
|
|
|
|
tf = append(tf, termFacet)
|
|
|
|
return tf
|
|
|
|
}
|
|
|
|
|
|
|
|
func (tf TermFacets) Len() int { return len(tf) }
|
|
|
|
func (tf TermFacets) Swap(i, j int) { tf[i], tf[j] = tf[j], tf[i] }
|
|
|
|
func (tf TermFacets) Less(i, j int) bool {
|
|
|
|
if tf[i].Count == tf[j].Count {
|
|
|
|
return tf[i].Term < tf[j].Term
|
|
|
|
}
|
|
|
|
return tf[i].Count > tf[j].Count
|
|
|
|
}
|
|
|
|
|
|
|
|
type NumericRangeFacet struct {
|
|
|
|
Name string `json:"name"`
|
|
|
|
Min *float64 `json:"min,omitempty"`
|
|
|
|
Max *float64 `json:"max,omitempty"`
|
|
|
|
Count int `json:"count"`
|
|
|
|
}
|
|
|
|
|
|
|
|
func (nrf *NumericRangeFacet) Same(other *NumericRangeFacet) bool {
|
|
|
|
if nrf.Min == nil && other.Min != nil {
|
|
|
|
return false
|
|
|
|
}
|
|
|
|
if nrf.Min != nil && other.Min == nil {
|
|
|
|
return false
|
|
|
|
}
|
|
|
|
if nrf.Min != nil && other.Min != nil && *nrf.Min != *other.Min {
|
|
|
|
return false
|
|
|
|
}
|
|
|
|
if nrf.Max == nil && other.Max != nil {
|
|
|
|
return false
|
|
|
|
}
|
|
|
|
if nrf.Max != nil && other.Max == nil {
|
|
|
|
return false
|
|
|
|
}
|
|
|
|
if nrf.Max != nil && other.Max != nil && *nrf.Max != *other.Max {
|
|
|
|
return false
|
|
|
|
}
|
|
|
|
|
|
|
|
return true
|
|
|
|
}
|
|
|
|
|
|
|
|
type NumericRangeFacets []*NumericRangeFacet
|
|
|
|
|
|
|
|
func (nrf NumericRangeFacets) Add(numericRangeFacet *NumericRangeFacet) NumericRangeFacets {
|
|
|
|
for _, existingNr := range nrf {
|
|
|
|
if numericRangeFacet.Same(existingNr) {
|
|
|
|
existingNr.Count += numericRangeFacet.Count
|
|
|
|
return nrf
|
|
|
|
}
|
|
|
|
}
|
|
|
|
// if we got here it wasn't already in the existing terms
|
|
|
|
nrf = append(nrf, numericRangeFacet)
|
|
|
|
return nrf
|
|
|
|
}
|
|
|
|
|
|
|
|
func (nrf NumericRangeFacets) Len() int { return len(nrf) }
|
|
|
|
func (nrf NumericRangeFacets) Swap(i, j int) { nrf[i], nrf[j] = nrf[j], nrf[i] }
|
|
|
|
func (nrf NumericRangeFacets) Less(i, j int) bool {
|
|
|
|
if nrf[i].Count == nrf[j].Count {
|
|
|
|
return nrf[i].Name < nrf[j].Name
|
|
|
|
}
|
|
|
|
return nrf[i].Count > nrf[j].Count
|
|
|
|
}
|
|
|
|
|
|
|
|
type DateRangeFacet struct {
|
|
|
|
Name string `json:"name"`
|
|
|
|
Start *string `json:"start,omitempty"`
|
|
|
|
End *string `json:"end,omitempty"`
|
|
|
|
Count int `json:"count"`
|
|
|
|
}
|
|
|
|
|
|
|
|
func (drf *DateRangeFacet) Same(other *DateRangeFacet) bool {
|
|
|
|
if drf.Start == nil && other.Start != nil {
|
|
|
|
return false
|
|
|
|
}
|
|
|
|
if drf.Start != nil && other.Start == nil {
|
|
|
|
return false
|
|
|
|
}
|
|
|
|
if drf.Start != nil && other.Start != nil && *drf.Start != *other.Start {
|
|
|
|
return false
|
|
|
|
}
|
|
|
|
if drf.End == nil && other.End != nil {
|
|
|
|
return false
|
|
|
|
}
|
|
|
|
if drf.End != nil && other.End == nil {
|
|
|
|
return false
|
|
|
|
}
|
|
|
|
if drf.End != nil && other.End != nil && *drf.End != *other.End {
|
|
|
|
return false
|
|
|
|
}
|
|
|
|
|
|
|
|
return true
|
|
|
|
}
|
|
|
|
|
|
|
|
type DateRangeFacets []*DateRangeFacet
|
|
|
|
|
|
|
|
func (drf DateRangeFacets) Add(dateRangeFacet *DateRangeFacet) DateRangeFacets {
|
|
|
|
for _, existingDr := range drf {
|
|
|
|
if dateRangeFacet.Same(existingDr) {
|
|
|
|
existingDr.Count += dateRangeFacet.Count
|
|
|
|
return drf
|
|
|
|
}
|
|
|
|
}
|
|
|
|
// if we got here it wasn't already in the existing terms
|
|
|
|
drf = append(drf, dateRangeFacet)
|
|
|
|
return drf
|
|
|
|
}
|
|
|
|
|
|
|
|
func (drf DateRangeFacets) Len() int { return len(drf) }
|
|
|
|
func (drf DateRangeFacets) Swap(i, j int) { drf[i], drf[j] = drf[j], drf[i] }
|
|
|
|
func (drf DateRangeFacets) Less(i, j int) bool {
|
|
|
|
if drf[i].Count == drf[j].Count {
|
|
|
|
return drf[i].Name < drf[j].Name
|
|
|
|
}
|
|
|
|
return drf[i].Count > drf[j].Count
|
|
|
|
}
|
|
|
|
|
|
|
|
type FacetResult struct {
|
|
|
|
Field string `json:"field"`
|
|
|
|
Total int `json:"total"`
|
|
|
|
Missing int `json:"missing"`
|
|
|
|
Other int `json:"other"`
|
|
|
|
Terms TermFacets `json:"terms,omitempty"`
|
|
|
|
NumericRanges NumericRangeFacets `json:"numeric_ranges,omitempty"`
|
|
|
|
DateRanges DateRangeFacets `json:"date_ranges,omitempty"`
|
|
|
|
}
|
|
|
|
|
2019-02-18 00:50:26 +00:00
|
|
|
func (fr *FacetResult) Size() int {
|
|
|
|
return reflectStaticSizeFacetResult + size.SizeOfPtr +
|
|
|
|
len(fr.Field) +
|
|
|
|
len(fr.Terms)*(reflectStaticSizeTermFacet+size.SizeOfPtr) +
|
|
|
|
len(fr.NumericRanges)*(reflectStaticSizeNumericRangeFacet+size.SizeOfPtr) +
|
|
|
|
len(fr.DateRanges)*(reflectStaticSizeDateRangeFacet+size.SizeOfPtr)
|
|
|
|
}
|
|
|
|
|
2017-01-25 02:43:02 +00:00
|
|
|
func (fr *FacetResult) Merge(other *FacetResult) {
|
|
|
|
fr.Total += other.Total
|
|
|
|
fr.Missing += other.Missing
|
|
|
|
fr.Other += other.Other
|
|
|
|
if fr.Terms != nil && other.Terms != nil {
|
|
|
|
for _, term := range other.Terms {
|
|
|
|
fr.Terms = fr.Terms.Add(term)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if fr.NumericRanges != nil && other.NumericRanges != nil {
|
|
|
|
for _, nr := range other.NumericRanges {
|
|
|
|
fr.NumericRanges = fr.NumericRanges.Add(nr)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if fr.DateRanges != nil && other.DateRanges != nil {
|
|
|
|
for _, dr := range other.DateRanges {
|
|
|
|
fr.DateRanges = fr.DateRanges.Add(dr)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func (fr *FacetResult) Fixup(size int) {
|
|
|
|
if fr.Terms != nil {
|
|
|
|
sort.Sort(fr.Terms)
|
|
|
|
if len(fr.Terms) > size {
|
|
|
|
moveToOther := fr.Terms[size:]
|
|
|
|
for _, mto := range moveToOther {
|
|
|
|
fr.Other += mto.Count
|
|
|
|
}
|
|
|
|
fr.Terms = fr.Terms[0:size]
|
|
|
|
}
|
|
|
|
} else if fr.NumericRanges != nil {
|
|
|
|
sort.Sort(fr.NumericRanges)
|
|
|
|
if len(fr.NumericRanges) > size {
|
|
|
|
moveToOther := fr.NumericRanges[size:]
|
|
|
|
for _, mto := range moveToOther {
|
|
|
|
fr.Other += mto.Count
|
|
|
|
}
|
|
|
|
fr.NumericRanges = fr.NumericRanges[0:size]
|
|
|
|
}
|
|
|
|
} else if fr.DateRanges != nil {
|
|
|
|
sort.Sort(fr.DateRanges)
|
|
|
|
if len(fr.DateRanges) > size {
|
|
|
|
moveToOther := fr.DateRanges[size:]
|
|
|
|
for _, mto := range moveToOther {
|
|
|
|
fr.Other += mto.Count
|
|
|
|
}
|
|
|
|
fr.DateRanges = fr.DateRanges[0:size]
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
type FacetResults map[string]*FacetResult
|
|
|
|
|
|
|
|
func (fr FacetResults) Merge(other FacetResults) {
|
|
|
|
for name, oFacetResult := range other {
|
|
|
|
facetResult, ok := fr[name]
|
|
|
|
if ok {
|
|
|
|
facetResult.Merge(oFacetResult)
|
|
|
|
} else {
|
|
|
|
fr[name] = oFacetResult
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func (fr FacetResults) Fixup(name string, size int) {
|
|
|
|
facetResult, ok := fr[name]
|
|
|
|
if ok {
|
|
|
|
facetResult.Fixup(size)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func (fb *FacetsBuilder) Results() FacetResults {
|
|
|
|
fr := make(FacetResults)
|
2019-02-18 00:50:26 +00:00
|
|
|
for i, facetBuilder := range fb.facets {
|
2017-01-25 02:43:02 +00:00
|
|
|
facetResult := facetBuilder.Result()
|
2019-02-18 00:50:26 +00:00
|
|
|
fr[fb.facetNames[i]] = facetResult
|
2017-01-25 02:43:02 +00:00
|
|
|
}
|
|
|
|
return fr
|
|
|
|
}
|