mirror of
https://gitee.com/milvus-io/milvus.git
synced 2024-12-10 07:49:29 +08:00
a08a0c831f
issue: #34545 Signed-off-by: jaime <yun.zhang@zilliz.com>
321 lines
9.1 KiB
Go
321 lines
9.1 KiB
Go
// Licensed to the LF AI & Data foundation under one
|
|
// or more contributor license agreements. See the NOTICE file
|
|
// distributed with this work for additional information
|
|
// regarding copyright ownership. The ASF licenses this file
|
|
// to you under the Apache License, Version 2.0 (the
|
|
// "License"); you may not use this file except in compliance
|
|
// with the License. You may obtain a copy of the License at
|
|
//
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
//
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
// See the License for the specific language governing permissions and
|
|
// limitations under the License.
|
|
|
|
package datacoord
|
|
|
|
import (
|
|
"context"
|
|
"fmt"
|
|
"strconv"
|
|
"strings"
|
|
"time"
|
|
|
|
"github.com/samber/lo"
|
|
"go.uber.org/zap"
|
|
|
|
"github.com/milvus-io/milvus-proto/go-api/v2/commonpb"
|
|
"github.com/milvus-io/milvus-proto/go-api/v2/milvuspb"
|
|
"github.com/milvus-io/milvus/internal/proto/datapb"
|
|
"github.com/milvus-io/milvus/pkg/common"
|
|
"github.com/milvus-io/milvus/pkg/log"
|
|
"github.com/milvus-io/milvus/pkg/metrics"
|
|
"github.com/milvus-io/milvus/pkg/util/funcutil"
|
|
"github.com/milvus-io/milvus/pkg/util/indexparamcheck"
|
|
"github.com/milvus-io/milvus/pkg/util/merr"
|
|
"github.com/milvus-io/milvus/pkg/util/paramtable"
|
|
"github.com/milvus-io/milvus/pkg/util/tsoutil"
|
|
"github.com/milvus-io/milvus/pkg/util/typeutil"
|
|
)
|
|
|
|
// Response response interface for verification
|
|
type Response interface {
|
|
GetStatus() *commonpb.Status
|
|
}
|
|
|
|
// VerifyResponse verify grpc Response 1. check error is nil 2. check response.GetStatus() with status success
|
|
func VerifyResponse(response interface{}, err error) error {
|
|
if err != nil {
|
|
return err
|
|
}
|
|
if response == nil {
|
|
return errNilResponse
|
|
}
|
|
switch resp := response.(type) {
|
|
case Response:
|
|
// note that resp will not be nil here, since it's still an interface
|
|
if resp.GetStatus() == nil {
|
|
return errNilStatusResponse
|
|
}
|
|
return merr.Error(resp.GetStatus())
|
|
|
|
case *commonpb.Status:
|
|
if resp == nil {
|
|
return errNilResponse
|
|
}
|
|
return merr.Error(resp)
|
|
default:
|
|
return errUnknownResponseType
|
|
}
|
|
}
|
|
|
|
func FilterInIndexedSegments(handler Handler, mt *meta, segments ...*SegmentInfo) []*SegmentInfo {
|
|
if len(segments) == 0 {
|
|
return nil
|
|
}
|
|
|
|
collectionSegments := lo.GroupBy(segments, func(segment *SegmentInfo) int64 {
|
|
return segment.GetCollectionID()
|
|
})
|
|
|
|
ret := make([]*SegmentInfo, 0)
|
|
for collection, segmentList := range collectionSegments {
|
|
ctx, cancel := context.WithTimeout(context.Background(), time.Second*2)
|
|
coll, err := handler.GetCollection(ctx, collection)
|
|
cancel()
|
|
if err != nil {
|
|
log.Warn("failed to get collection schema", zap.Error(err))
|
|
continue
|
|
}
|
|
|
|
// get vector field id
|
|
vecFieldIDs := make([]int64, 0)
|
|
for _, field := range coll.Schema.GetFields() {
|
|
if typeutil.IsVectorType(field.GetDataType()) {
|
|
vecFieldIDs = append(vecFieldIDs, field.GetFieldID())
|
|
}
|
|
}
|
|
segmentIDs := lo.Map(segmentList, func(seg *SegmentInfo, _ int) UniqueID {
|
|
return seg.GetID()
|
|
})
|
|
|
|
// get indexed segments which finish build index on all vector field
|
|
indexed := mt.indexMeta.GetIndexedSegments(collection, segmentIDs, vecFieldIDs)
|
|
if len(indexed) > 0 {
|
|
indexedSet := typeutil.NewUniqueSet(indexed...)
|
|
for _, segment := range segmentList {
|
|
if !isFlushState(segment.GetState()) && segment.GetState() != commonpb.SegmentState_Dropped {
|
|
continue
|
|
}
|
|
|
|
if indexedSet.Contain(segment.GetID()) {
|
|
ret = append(ret, segment)
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
return ret
|
|
}
|
|
|
|
func getZeroTime() time.Time {
|
|
var t time.Time
|
|
return t
|
|
}
|
|
|
|
// getCollectionTTL returns ttl if collection's ttl is specified, or return global ttl
|
|
func getCollectionTTL(properties map[string]string) (time.Duration, error) {
|
|
v, ok := properties[common.CollectionTTLConfigKey]
|
|
if ok {
|
|
ttl, err := strconv.Atoi(v)
|
|
if err != nil {
|
|
return -1, err
|
|
}
|
|
return time.Duration(ttl) * time.Second, nil
|
|
}
|
|
|
|
return Params.CommonCfg.EntityExpirationTTL.GetAsDuration(time.Second), nil
|
|
}
|
|
|
|
func UpdateCompactionSegmentSizeMetrics(segments []*datapb.CompactionSegment) {
|
|
var totalSize int64
|
|
for _, seg := range segments {
|
|
totalSize += getCompactedSegmentSize(seg)
|
|
}
|
|
// observe size in bytes
|
|
metrics.DataCoordCompactedSegmentSize.WithLabelValues().Observe(float64(totalSize))
|
|
}
|
|
|
|
func getCompactedSegmentSize(s *datapb.CompactionSegment) int64 {
|
|
var segmentSize int64
|
|
if s != nil {
|
|
for _, binlogs := range s.GetInsertLogs() {
|
|
for _, l := range binlogs.GetBinlogs() {
|
|
segmentSize += l.GetMemorySize()
|
|
}
|
|
}
|
|
|
|
for _, deltaLogs := range s.GetDeltalogs() {
|
|
for _, l := range deltaLogs.GetBinlogs() {
|
|
segmentSize += l.GetMemorySize()
|
|
}
|
|
}
|
|
|
|
for _, statsLogs := range s.GetField2StatslogPaths() {
|
|
for _, l := range statsLogs.GetBinlogs() {
|
|
segmentSize += l.GetMemorySize()
|
|
}
|
|
}
|
|
}
|
|
|
|
return segmentSize
|
|
}
|
|
|
|
// getCollectionAutoCompactionEnabled returns whether auto compaction for collection is enabled.
|
|
// if not set, returns global auto compaction config.
|
|
func getCollectionAutoCompactionEnabled(properties map[string]string) (bool, error) {
|
|
v, ok := properties[common.CollectionAutoCompactionKey]
|
|
if ok {
|
|
enabled, err := strconv.ParseBool(v)
|
|
if err != nil {
|
|
return false, err
|
|
}
|
|
return enabled, nil
|
|
}
|
|
return Params.DataCoordCfg.EnableAutoCompaction.GetAsBool(), nil
|
|
}
|
|
|
|
func GetIndexType(indexParams []*commonpb.KeyValuePair) string {
|
|
for _, param := range indexParams {
|
|
if param.Key == common.IndexTypeKey {
|
|
return param.Value
|
|
}
|
|
}
|
|
return invalidIndex
|
|
}
|
|
|
|
func isFlatIndex(indexType string) bool {
|
|
return indexType == indexparamcheck.IndexFaissIDMap || indexType == indexparamcheck.IndexFaissBinIDMap
|
|
}
|
|
|
|
func isOptionalScalarFieldSupported(indexType string) bool {
|
|
return indexType == indexparamcheck.IndexHNSW
|
|
}
|
|
|
|
func isDiskANNIndex(indexType string) bool {
|
|
return indexType == indexparamcheck.IndexDISKANN
|
|
}
|
|
|
|
func parseBuildIDFromFilePath(key string) (UniqueID, error) {
|
|
ss := strings.Split(key, "/")
|
|
if strings.HasSuffix(key, "/") {
|
|
return strconv.ParseInt(ss[len(ss)-2], 10, 64)
|
|
}
|
|
return strconv.ParseInt(ss[len(ss)-1], 10, 64)
|
|
}
|
|
|
|
func getFieldBinlogs(id UniqueID, binlogs []*datapb.FieldBinlog) *datapb.FieldBinlog {
|
|
for _, binlog := range binlogs {
|
|
if id == binlog.GetFieldID() {
|
|
return binlog
|
|
}
|
|
}
|
|
return nil
|
|
}
|
|
|
|
func mergeFieldBinlogs(currentBinlogs []*datapb.FieldBinlog, newBinlogs []*datapb.FieldBinlog) []*datapb.FieldBinlog {
|
|
for _, newBinlog := range newBinlogs {
|
|
fieldBinlogs := getFieldBinlogs(newBinlog.GetFieldID(), currentBinlogs)
|
|
if fieldBinlogs == nil {
|
|
currentBinlogs = append(currentBinlogs, newBinlog)
|
|
} else {
|
|
fieldBinlogs.Binlogs = append(fieldBinlogs.Binlogs, newBinlog.Binlogs...)
|
|
}
|
|
}
|
|
return currentBinlogs
|
|
}
|
|
|
|
func calculateL0SegmentSize(fields []*datapb.FieldBinlog) float64 {
|
|
size := int64(0)
|
|
for _, field := range fields {
|
|
for _, binlog := range field.GetBinlogs() {
|
|
size += binlog.GetMemorySize()
|
|
}
|
|
}
|
|
return float64(size)
|
|
}
|
|
|
|
func getCompactionMergeInfo(task *datapb.CompactionTask) *milvuspb.CompactionMergeInfo {
|
|
/*
|
|
segments := task.GetPlan().GetSegmentBinlogs()
|
|
var sources []int64
|
|
for _, s := range segments {
|
|
sources = append(sources, s.GetSegmentID())
|
|
}
|
|
*/
|
|
var target int64 = -1
|
|
if len(task.GetResultSegments()) > 0 {
|
|
target = task.GetResultSegments()[0]
|
|
}
|
|
return &milvuspb.CompactionMergeInfo{
|
|
Sources: task.GetInputSegments(),
|
|
Target: target,
|
|
}
|
|
}
|
|
|
|
func getBinLogIDs(segment *SegmentInfo, fieldID int64) []int64 {
|
|
binlogIDs := make([]int64, 0)
|
|
for _, fieldBinLog := range segment.GetBinlogs() {
|
|
if fieldBinLog.GetFieldID() == fieldID {
|
|
for _, binLog := range fieldBinLog.GetBinlogs() {
|
|
binlogIDs = append(binlogIDs, binLog.GetLogID())
|
|
}
|
|
break
|
|
}
|
|
}
|
|
return binlogIDs
|
|
}
|
|
|
|
func CheckCheckPointsHealth(meta *meta) error {
|
|
for channel, cp := range meta.GetChannelCheckpoints() {
|
|
collectionID := funcutil.GetCollectionIDFromVChannel(channel)
|
|
if collectionID == -1 {
|
|
log.RatedWarn(60, "can't parse collection id from vchannel, skip check cp lag", zap.String("vchannel", channel))
|
|
continue
|
|
}
|
|
if meta.GetCollection(collectionID) == nil {
|
|
log.RatedWarn(60, "corresponding the collection doesn't exists, skip check cp lag", zap.String("vchannel", channel))
|
|
continue
|
|
}
|
|
ts, _ := tsoutil.ParseTS(cp.Timestamp)
|
|
lag := time.Since(ts)
|
|
if lag > paramtable.Get().DataCoordCfg.ChannelCheckpointMaxLag.GetAsDuration(time.Second) {
|
|
return merr.WrapErrChannelCPExceededMaxLag(channel, fmt.Sprintf("checkpoint lag: %f(min)", lag.Minutes()))
|
|
}
|
|
}
|
|
return nil
|
|
}
|
|
|
|
func CheckAllChannelsWatched(meta *meta, channelManager ChannelManager) error {
|
|
collIDs := meta.ListCollections()
|
|
for _, collID := range collIDs {
|
|
collInfo := meta.GetCollection(collID)
|
|
if collInfo == nil {
|
|
log.Warn("collection info is nil, skip it", zap.Int64("collectionID", collID))
|
|
continue
|
|
}
|
|
|
|
for _, channelName := range collInfo.VChannelNames {
|
|
_, err := channelManager.FindWatcher(channelName)
|
|
if err != nil {
|
|
log.Warn("find watcher for channel failed", zap.Int64("collectionID", collID),
|
|
zap.String("channelName", channelName), zap.Error(err))
|
|
return err
|
|
}
|
|
}
|
|
}
|
|
return nil
|
|
}
|