2019-02-18 08:50:26 +08:00
|
|
|
// Copyright (c) 2018 Couchbase, Inc.
|
2017-01-24 21:43:02 -05:00
|
|
|
//
|
|
|
|
// Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
// you may not use this file except in compliance with the License.
|
|
|
|
// You may obtain a copy of the License at
|
|
|
|
//
|
|
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
//
|
|
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
|
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
// See the License for the specific language governing permissions and
|
|
|
|
// limitations under the License.
|
|
|
|
|
|
|
|
package searcher
|
|
|
|
|
|
|
|
import (
|
|
|
|
"fmt"
|
|
|
|
"github.com/blevesearch/bleve/index"
|
|
|
|
"github.com/blevesearch/bleve/search"
|
|
|
|
)
|
|
|
|
|
|
|
|
// DisjunctionMaxClauseCount is a compile time setting that applications can
|
|
|
|
// adjust to a non-zero value to cause the DisjunctionSearcher to return an
|
|
|
|
// error instead of executing searches when the size exceeds this value.
|
|
|
|
var DisjunctionMaxClauseCount = 0
|
|
|
|
|
2019-02-18 08:50:26 +08:00
|
|
|
// DisjunctionHeapTakeover is a compile time setting that applications can
|
|
|
|
// adjust to control when the DisjunctionSearcher will switch from a simple
|
|
|
|
// slice implementation to a heap implementation.
|
|
|
|
var DisjunctionHeapTakeover = 10
|
2017-01-24 21:43:02 -05:00
|
|
|
|
2017-09-16 13:16:21 -07:00
|
|
|
func NewDisjunctionSearcher(indexReader index.IndexReader,
|
|
|
|
qsearchers []search.Searcher, min float64, options search.SearcherOptions) (
|
2019-02-18 08:50:26 +08:00
|
|
|
search.Searcher, error) {
|
|
|
|
return newDisjunctionSearcher(indexReader, qsearchers, min, options, true)
|
2017-09-16 13:16:21 -07:00
|
|
|
}
|
|
|
|
|
2020-09-07 06:51:14 +08:00
|
|
|
func optionsDisjunctionOptimizable(options search.SearcherOptions) bool {
|
|
|
|
rv := options.Score == "none" && !options.IncludeTermVectors
|
|
|
|
return rv
|
|
|
|
}
|
|
|
|
|
2017-09-16 13:16:21 -07:00
|
|
|
func newDisjunctionSearcher(indexReader index.IndexReader,
|
|
|
|
qsearchers []search.Searcher, min float64, options search.SearcherOptions,
|
2019-02-18 08:50:26 +08:00
|
|
|
limit bool) (search.Searcher, error) {
|
|
|
|
// attempt the "unadorned" disjunction optimization only when we
|
|
|
|
// do not need extra information like freq-norm's or term vectors
|
|
|
|
// and the requested min is simple
|
|
|
|
if len(qsearchers) > 1 && min <= 1 &&
|
2020-09-07 06:51:14 +08:00
|
|
|
optionsDisjunctionOptimizable(options) {
|
2019-02-18 08:50:26 +08:00
|
|
|
rv, err := optimizeCompositeSearcher("disjunction:unadorned",
|
|
|
|
indexReader, qsearchers, options)
|
|
|
|
if err != nil || rv != nil {
|
|
|
|
return rv, err
|
2017-01-24 21:43:02 -05:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2019-02-18 08:50:26 +08:00
|
|
|
if len(qsearchers) > DisjunctionHeapTakeover {
|
|
|
|
return newDisjunctionHeapSearcher(indexReader, qsearchers, min, options,
|
|
|
|
limit)
|
2017-01-24 21:43:02 -05:00
|
|
|
}
|
2019-02-18 08:50:26 +08:00
|
|
|
return newDisjunctionSliceSearcher(indexReader, qsearchers, min, options,
|
|
|
|
limit)
|
2017-01-24 21:43:02 -05:00
|
|
|
}
|
|
|
|
|
2019-02-18 08:50:26 +08:00
|
|
|
func optimizeCompositeSearcher(optimizationKind string,
|
|
|
|
indexReader index.IndexReader, qsearchers []search.Searcher,
|
|
|
|
options search.SearcherOptions) (search.Searcher, error) {
|
|
|
|
var octx index.OptimizableContext
|
2017-01-24 21:43:02 -05:00
|
|
|
|
2019-02-18 08:50:26 +08:00
|
|
|
for _, searcher := range qsearchers {
|
|
|
|
o, ok := searcher.(index.Optimizable)
|
|
|
|
if !ok {
|
|
|
|
return nil, nil
|
2017-01-24 21:43:02 -05:00
|
|
|
}
|
|
|
|
|
2019-02-18 08:50:26 +08:00
|
|
|
var err error
|
|
|
|
octx, err = o.Optimize(optimizationKind, octx)
|
2017-01-24 21:43:02 -05:00
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
2019-02-18 08:50:26 +08:00
|
|
|
if octx == nil {
|
|
|
|
return nil, nil
|
2017-01-24 21:43:02 -05:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2019-02-18 08:50:26 +08:00
|
|
|
optimized, err := octx.Finish()
|
|
|
|
if err != nil || optimized == nil {
|
2017-01-24 21:43:02 -05:00
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
2019-02-18 08:50:26 +08:00
|
|
|
tfr, ok := optimized.(index.TermFieldReader)
|
|
|
|
if !ok {
|
|
|
|
return nil, nil
|
2017-01-24 21:43:02 -05:00
|
|
|
}
|
|
|
|
|
2019-02-18 08:50:26 +08:00
|
|
|
return newTermSearcherFromReader(indexReader, tfr,
|
|
|
|
[]byte(optimizationKind), "*", 1.0, options)
|
2017-01-24 21:43:02 -05:00
|
|
|
}
|
|
|
|
|
2019-02-18 08:50:26 +08:00
|
|
|
func tooManyClauses(count int) bool {
|
|
|
|
if DisjunctionMaxClauseCount != 0 && count > DisjunctionMaxClauseCount {
|
|
|
|
return true
|
|
|
|
}
|
|
|
|
return false
|
2017-01-24 21:43:02 -05:00
|
|
|
}
|
|
|
|
|
2020-09-07 06:51:14 +08:00
|
|
|
func tooManyClausesErr(field string, count int) error {
|
|
|
|
return fmt.Errorf("TooManyClauses over field: `%s` [%d > maxClauseCount,"+
|
|
|
|
" which is set to %d]", field, count, DisjunctionMaxClauseCount)
|
2017-01-24 21:43:02 -05:00
|
|
|
}
|