mirror of
https://gitee.com/milvus-io/milvus.git
synced 2024-12-02 20:09:57 +08:00
e1e87d572b
patch search cache param from index configs when index meta could not get the search cache size key #issue: #30113 Signed-off-by: xianliang.li <xianliang.li@zilliz.com>
368 lines
12 KiB
Go
368 lines
12 KiB
Go
// Licensed to the LF AI & Data foundation under one
|
|
// or more contributor license agreements. See the NOTICE file
|
|
// distributed with this work for additional information
|
|
// regarding copyright ownership. The ASF licenses this file
|
|
// to you under the Apache License, Version 2.0 (the
|
|
// "License"); you may not use this file except in compliance
|
|
// with the License. You may obtain a copy of the License at
|
|
//
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
//
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
// See the License for the specific language governing permissions and
|
|
// limitations under the License.
|
|
|
|
package indexparams
|
|
|
|
import (
|
|
"encoding/json"
|
|
"fmt"
|
|
"strconv"
|
|
"unsafe"
|
|
|
|
"github.com/milvus-io/milvus-proto/go-api/v2/commonpb"
|
|
"github.com/milvus-io/milvus/pkg/common"
|
|
"github.com/milvus-io/milvus/pkg/util/funcutil"
|
|
"github.com/milvus-io/milvus/pkg/util/hardware"
|
|
"github.com/milvus-io/milvus/pkg/util/paramtable"
|
|
"github.com/milvus-io/milvus/pkg/util/typeutil"
|
|
)
|
|
|
|
const (
|
|
PQCodeBudgetRatioKey = "pq_code_budget_gb_ratio"
|
|
NumBuildThreadRatioKey = "num_build_thread_ratio"
|
|
SearchCacheBudgetRatioKey = "search_cache_budget_gb_ratio"
|
|
NumLoadThreadRatioKey = "num_load_thread_ratio"
|
|
BeamWidthRatioKey = "beamwidth_ratio"
|
|
|
|
MaxDegreeKey = "max_degree"
|
|
SearchListSizeKey = "search_list_size"
|
|
PQCodeBudgetKey = "pq_code_budget_gb"
|
|
BuildDramBudgetKey = "build_dram_budget_gb"
|
|
NumBuildThreadKey = "num_build_thread"
|
|
SearchCacheBudgetKey = "search_cache_budget_gb"
|
|
NumLoadThreadKey = "num_load_thread"
|
|
BeamWidthKey = "beamwidth"
|
|
|
|
MaxLoadThread = 64
|
|
MaxBeamWidth = 16
|
|
)
|
|
|
|
var configableIndexParams = typeutil.NewSet[string]()
|
|
|
|
func init() {
|
|
configableIndexParams.Insert(common.MmapEnabledKey)
|
|
}
|
|
|
|
func IsConfigableIndexParam(key string) bool {
|
|
return configableIndexParams.Contain(key)
|
|
}
|
|
|
|
func getRowDataSizeOfFloatVector(numRows int64, dim int64) int64 {
|
|
var floatValue float32
|
|
/* #nosec G103 */
|
|
return int64(unsafe.Sizeof(floatValue)) * dim * numRows
|
|
}
|
|
|
|
type BigDataIndexExtraParams struct {
|
|
PQCodeBudgetGBRatio float64
|
|
BuildNumThreadsRatio float64
|
|
SearchCacheBudgetGBRatio float64
|
|
LoadNumThreadRatio float64
|
|
BeamWidthRatio float64
|
|
}
|
|
|
|
const (
|
|
BuildRatioKey = "build_ratio"
|
|
PrepareRatioKey = "prepare_ratio"
|
|
DefaultPQCodeBudgetGBRatio = 0.125
|
|
DefaultBuildNumThreadsRatio = 1.0
|
|
DefaultSearchCacheBudgetGBRatio = 0.10
|
|
DefaultLoadNumThreadRatio = 8.0
|
|
DefaultBeamWidthRatio = 4.0
|
|
)
|
|
|
|
func NewBigDataExtraParamsFromJSON(jsonStr string) (*BigDataIndexExtraParams, error) {
|
|
buffer, err := funcutil.JSONToMap(jsonStr)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
return NewBigDataExtraParamsFromMap(buffer)
|
|
}
|
|
|
|
func NewBigDataExtraParamsFromMap(value map[string]string) (*BigDataIndexExtraParams, error) {
|
|
ret := &BigDataIndexExtraParams{}
|
|
ret.SearchCacheBudgetGBRatio = DefaultSearchCacheBudgetGBRatio
|
|
setSearchCache := false
|
|
var err error
|
|
buildRatio, ok := value[BuildRatioKey]
|
|
if !ok {
|
|
ret.PQCodeBudgetGBRatio = DefaultPQCodeBudgetGBRatio
|
|
ret.BuildNumThreadsRatio = DefaultBuildNumThreadsRatio
|
|
} else {
|
|
valueMap1 := make(map[string]float64)
|
|
err = json.Unmarshal([]byte(buildRatio), &valueMap1)
|
|
if err != nil {
|
|
return ret, err
|
|
}
|
|
PQCodeBudgetGBRatio, ok := valueMap1["pq_code_budget_gb"]
|
|
if !ok {
|
|
ret.PQCodeBudgetGBRatio = DefaultPQCodeBudgetGBRatio
|
|
} else {
|
|
ret.PQCodeBudgetGBRatio = PQCodeBudgetGBRatio
|
|
}
|
|
BuildNumThreadsRatio, ok := valueMap1["num_threads"]
|
|
if !ok {
|
|
ret.BuildNumThreadsRatio = DefaultBuildNumThreadsRatio
|
|
} else {
|
|
ret.BuildNumThreadsRatio = BuildNumThreadsRatio
|
|
}
|
|
SearchCacheBudgetGBRatio, ok := valueMap1["search_cache_budget_gb"]
|
|
if ok {
|
|
ret.SearchCacheBudgetGBRatio = SearchCacheBudgetGBRatio
|
|
setSearchCache = true
|
|
}
|
|
}
|
|
|
|
prepareRatio, ok := value[PrepareRatioKey]
|
|
if !ok {
|
|
ret.SearchCacheBudgetGBRatio = DefaultSearchCacheBudgetGBRatio
|
|
ret.LoadNumThreadRatio = DefaultLoadNumThreadRatio
|
|
} else {
|
|
valueMap2 := make(map[string]float64)
|
|
err = json.Unmarshal([]byte(prepareRatio), &valueMap2)
|
|
if err != nil {
|
|
return ret, err
|
|
}
|
|
SearchCacheBudgetGBRatio, ok := valueMap2["search_cache_budget_gb"]
|
|
if ok && !setSearchCache {
|
|
ret.SearchCacheBudgetGBRatio = SearchCacheBudgetGBRatio
|
|
}
|
|
LoadNumThreadRatio, ok := valueMap2["num_threads"]
|
|
if !ok {
|
|
ret.LoadNumThreadRatio = DefaultLoadNumThreadRatio
|
|
} else {
|
|
ret.LoadNumThreadRatio = LoadNumThreadRatio
|
|
}
|
|
}
|
|
beamWidthRatioStr, ok := value[BeamWidthRatioKey]
|
|
if !ok {
|
|
ret.BeamWidthRatio = DefaultBeamWidthRatio
|
|
} else {
|
|
beamWidthRatio, err := strconv.ParseFloat(beamWidthRatioStr, 64)
|
|
if err != nil {
|
|
ret.BeamWidthRatio = DefaultBeamWidthRatio
|
|
} else {
|
|
ret.BeamWidthRatio = beamWidthRatio
|
|
}
|
|
}
|
|
|
|
return ret, nil
|
|
}
|
|
|
|
// FillDiskIndexParams fill ratio params to index param on proxy node
|
|
// Which will be used to calculate build and load params
|
|
func FillDiskIndexParams(params *paramtable.ComponentParam, indexParams map[string]string) error {
|
|
var maxDegree string
|
|
var searchListSize string
|
|
var pqCodeBudgetGBRatio string
|
|
var buildNumThreadsRatio string
|
|
var searchCacheBudgetGBRatio string
|
|
|
|
if params.AutoIndexConfig.Enable.GetAsBool() {
|
|
indexParams := params.AutoIndexConfig.IndexParams.GetAsJSONMap()
|
|
var ok bool
|
|
maxDegree, ok = indexParams[MaxDegreeKey]
|
|
if !ok {
|
|
return fmt.Errorf("index param max_degree not exist")
|
|
}
|
|
searchListSize, ok = indexParams[SearchListSizeKey]
|
|
if !ok {
|
|
return fmt.Errorf("index param search_list_size not exist")
|
|
}
|
|
extraParams, err := NewBigDataExtraParamsFromJSON(params.AutoIndexConfig.ExtraParams.GetValue())
|
|
if err != nil {
|
|
return err
|
|
}
|
|
pqCodeBudgetGBRatio = fmt.Sprintf("%f", extraParams.PQCodeBudgetGBRatio)
|
|
buildNumThreadsRatio = fmt.Sprintf("%f", extraParams.BuildNumThreadsRatio)
|
|
searchCacheBudgetGBRatio = fmt.Sprintf("%f", extraParams.SearchCacheBudgetGBRatio)
|
|
} else {
|
|
maxDegree = params.CommonCfg.MaxDegree.GetValue()
|
|
searchListSize = params.CommonCfg.SearchListSize.GetValue()
|
|
pqCodeBudgetGBRatio = params.CommonCfg.PQCodeBudgetGBRatio.GetValue()
|
|
buildNumThreadsRatio = params.CommonCfg.BuildNumThreadsRatio.GetValue()
|
|
searchCacheBudgetGBRatio = params.CommonCfg.SearchCacheBudgetGBRatio.GetValue()
|
|
}
|
|
|
|
indexParams[MaxDegreeKey] = maxDegree
|
|
indexParams[SearchListSizeKey] = searchListSize
|
|
indexParams[PQCodeBudgetRatioKey] = pqCodeBudgetGBRatio
|
|
indexParams[NumBuildThreadRatioKey] = buildNumThreadsRatio
|
|
indexParams[SearchCacheBudgetRatioKey] = searchCacheBudgetGBRatio
|
|
|
|
return nil
|
|
}
|
|
|
|
func GetIndexParams(indexParams []*commonpb.KeyValuePair, key string) string {
|
|
for _, param := range indexParams {
|
|
if param.Key == key {
|
|
return param.Value
|
|
}
|
|
}
|
|
return ""
|
|
}
|
|
|
|
// UpdateDiskIndexBuildParams update index params for `buildIndex` (override search cache size in `CreateIndex`)
|
|
func UpdateDiskIndexBuildParams(params *paramtable.ComponentParam, indexParams []*commonpb.KeyValuePair) ([]*commonpb.KeyValuePair, error) {
|
|
existedVal := GetIndexParams(indexParams, SearchCacheBudgetRatioKey)
|
|
|
|
var searchCacheBudgetGBRatio string
|
|
if params.AutoIndexConfig.Enable.GetAsBool() {
|
|
extraParams, err := NewBigDataExtraParamsFromJSON(params.AutoIndexConfig.ExtraParams.GetValue())
|
|
if err != nil {
|
|
return indexParams, fmt.Errorf("index param search_cache_budget_gb_ratio not exist in AutoIndex Config")
|
|
}
|
|
searchCacheBudgetGBRatio = fmt.Sprintf("%f", extraParams.SearchCacheBudgetGBRatio)
|
|
} else {
|
|
paramVal, err := strconv.ParseFloat(params.CommonCfg.SearchCacheBudgetGBRatio.GetValue(), 64)
|
|
if err != nil {
|
|
return indexParams, fmt.Errorf("index param search_cache_budget_gb_ratio not exist in Config")
|
|
}
|
|
searchCacheBudgetGBRatio = fmt.Sprintf("%f", paramVal)
|
|
}
|
|
|
|
// append when not exist
|
|
if len(existedVal) == 0 {
|
|
indexParams = append(indexParams,
|
|
&commonpb.KeyValuePair{
|
|
Key: SearchCacheBudgetRatioKey,
|
|
Value: searchCacheBudgetGBRatio,
|
|
})
|
|
return indexParams, nil
|
|
}
|
|
// override when exist
|
|
updatedParams := make([]*commonpb.KeyValuePair, 0, len(indexParams))
|
|
for _, param := range indexParams {
|
|
if param.Key == SearchCacheBudgetRatioKey {
|
|
updatedParams = append(updatedParams,
|
|
&commonpb.KeyValuePair{
|
|
Key: SearchCacheBudgetRatioKey,
|
|
Value: searchCacheBudgetGBRatio,
|
|
})
|
|
} else {
|
|
updatedParams = append(updatedParams,
|
|
&commonpb.KeyValuePair{
|
|
Key: param.Key,
|
|
Value: param.Value,
|
|
})
|
|
}
|
|
}
|
|
return updatedParams, nil
|
|
}
|
|
|
|
// SetDiskIndexBuildParams set index build params with ratio params on indexNode
|
|
// IndexNode cal build param with ratio params and cpu count, memory count...
|
|
func SetDiskIndexBuildParams(indexParams map[string]string, fieldDataSize int64) error {
|
|
pqCodeBudgetGBRatioStr, ok := indexParams[PQCodeBudgetRatioKey]
|
|
if !ok {
|
|
return fmt.Errorf("index param pqCodeBudgetGBRatio not exist")
|
|
}
|
|
pqCodeBudgetGBRatio, err := strconv.ParseFloat(pqCodeBudgetGBRatioStr, 64)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
buildNumThreadsRatioStr, ok := indexParams[NumBuildThreadRatioKey]
|
|
if !ok {
|
|
return fmt.Errorf("index param buildNumThreadsRatio not exist")
|
|
}
|
|
buildNumThreadsRatio, err := strconv.ParseFloat(buildNumThreadsRatioStr, 64)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
|
|
searchCacheBudgetGBRatioStr, ok := indexParams[SearchCacheBudgetRatioKey]
|
|
// set generate cache size when cache ratio param not set
|
|
if ok {
|
|
SearchCacheBudgetGBRatio, err := strconv.ParseFloat(searchCacheBudgetGBRatioStr, 64)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
indexParams[SearchCacheBudgetKey] = fmt.Sprintf("%f", float32(fieldDataSize)*float32(SearchCacheBudgetGBRatio)/(1<<30))
|
|
}
|
|
indexParams[PQCodeBudgetKey] = fmt.Sprintf("%f", float32(fieldDataSize)*float32(pqCodeBudgetGBRatio)/(1<<30))
|
|
indexParams[NumBuildThreadKey] = strconv.Itoa(int(float32(hardware.GetCPUNum()) * float32(buildNumThreadsRatio)))
|
|
indexParams[BuildDramBudgetKey] = fmt.Sprintf("%f", float32(hardware.GetFreeMemoryCount())/(1<<30))
|
|
return nil
|
|
}
|
|
|
|
// SetDiskIndexLoadParams set disk index load params with ratio params on queryNode
|
|
// QueryNode cal load params with ratio params ans cpu count...
|
|
func SetDiskIndexLoadParams(params *paramtable.ComponentParam, indexParams map[string]string, numRows int64) error {
|
|
dimStr, ok := indexParams[common.DimKey]
|
|
if !ok {
|
|
// type param dim has been put into index params before build index
|
|
return fmt.Errorf("type param dim not exist")
|
|
}
|
|
dim, err := strconv.ParseInt(dimStr, 10, 64)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
|
|
var searchCacheBudgetGBRatio float64
|
|
var loadNumThreadRatio float64
|
|
var beamWidthRatio float64
|
|
|
|
if params.AutoIndexConfig.Enable.GetAsBool() {
|
|
extraParams, err := NewBigDataExtraParamsFromJSON(params.AutoIndexConfig.ExtraParams.GetValue())
|
|
if err != nil {
|
|
return err
|
|
}
|
|
searchCacheBudgetGBRatio = extraParams.SearchCacheBudgetGBRatio
|
|
loadNumThreadRatio = extraParams.LoadNumThreadRatio
|
|
beamWidthRatio = extraParams.BeamWidthRatio
|
|
} else {
|
|
searchCacheBudgetGBRatio, err = strconv.ParseFloat(params.CommonCfg.SearchCacheBudgetGBRatio.GetValue(), 64)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
loadNumThreadRatio, err = strconv.ParseFloat(params.CommonCfg.LoadNumThreadRatio.GetValue(), 64)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
beamWidthRatio, err = strconv.ParseFloat(params.CommonCfg.BeamWidthRatio.GetValue(), 64)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
}
|
|
|
|
indexParams[SearchCacheBudgetKey] = fmt.Sprintf("%f",
|
|
float32(getRowDataSizeOfFloatVector(numRows, dim))*float32(searchCacheBudgetGBRatio)/(1<<30))
|
|
|
|
numLoadThread := int(float32(hardware.GetCPUNum()) * float32(loadNumThreadRatio))
|
|
if numLoadThread > MaxLoadThread {
|
|
numLoadThread = MaxLoadThread
|
|
}
|
|
indexParams[NumLoadThreadKey] = strconv.Itoa(numLoadThread)
|
|
|
|
beamWidth := int(float32(hardware.GetCPUNum()) * float32(beamWidthRatio))
|
|
if beamWidth > MaxBeamWidth {
|
|
beamWidth = MaxBeamWidth
|
|
}
|
|
indexParams[BeamWidthKey] = strconv.Itoa(beamWidth)
|
|
|
|
return nil
|
|
}
|
|
|
|
func AppendPrepareLoadParams(params *paramtable.ComponentParam, indexParams map[string]string) error {
|
|
if params.AutoIndexConfig.Enable.GetAsBool() { // `enable` only for cloud instance.
|
|
// override prepare params by
|
|
for k, v := range params.AutoIndexConfig.PrepareParams.GetAsJSONMap() {
|
|
indexParams[k] = v
|
|
}
|
|
}
|
|
return nil
|
|
}
|