// Licensed to the LF AI & Data foundation under one // or more contributor license agreements. See the NOTICE file // distributed with this work for additional information // regarding copyright ownership. The ASF licenses this file // to you under the Apache License, Version 2.0 (the // "License"); you may not use this file except in compliance // with the License. You may obtain a copy of the License at // // http://www.apache.org/licenses/LICENSE-2.0 // // Unless required by applicable law or agreed to in writing, software // distributed under the License is distributed on an "AS IS" BASIS, // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. // See the License for the specific language governing permissions and // limitations under the License. package datacoord import ( "context" "strconv" "strings" "time" "github.com/samber/lo" "go.uber.org/zap" "github.com/milvus-io/milvus-proto/go-api/v2/commonpb" "github.com/milvus-io/milvus/internal/proto/datapb" "github.com/milvus-io/milvus/pkg/common" "github.com/milvus-io/milvus/pkg/log" "github.com/milvus-io/milvus/pkg/metrics" "github.com/milvus-io/milvus/pkg/util/indexparamcheck" "github.com/milvus-io/milvus/pkg/util/merr" "github.com/milvus-io/milvus/pkg/util/typeutil" ) // Response response interface for verification type Response interface { GetStatus() *commonpb.Status } // VerifyResponse verify grpc Response 1. check error is nil 2. check response.GetStatus() with status success func VerifyResponse(response interface{}, err error) error { if err != nil { return err } if response == nil { return errNilResponse } switch resp := response.(type) { case Response: // note that resp will not be nil here, since it's still an interface if resp.GetStatus() == nil { return errNilStatusResponse } return merr.Error(resp.GetStatus()) case *commonpb.Status: if resp == nil { return errNilResponse } return merr.Error(resp) default: return errUnknownResponseType } } func FilterInIndexedSegments(handler Handler, mt *meta, segments ...*SegmentInfo) []*SegmentInfo { if len(segments) == 0 { return nil } collectionSegments := lo.GroupBy(segments, func(segment *SegmentInfo) int64 { return segment.GetCollectionID() }) ret := make([]*SegmentInfo, 0) for collection, segmentList := range collectionSegments { ctx, cancel := context.WithTimeout(context.Background(), time.Second*2) coll, err := handler.GetCollection(ctx, collection) cancel() if err != nil { log.Warn("failed to get collection schema", zap.Error(err)) continue } // get vector field id vecFieldIDs := make([]int64, 0) for _, field := range coll.Schema.GetFields() { if typeutil.IsVectorType(field.GetDataType()) { vecFieldIDs = append(vecFieldIDs, field.GetFieldID()) } } segmentIDs := lo.Map(segmentList, func(seg *SegmentInfo, _ int) UniqueID { return seg.GetID() }) // get indexed segments which finish build index on all vector field indexed := mt.indexMeta.GetIndexedSegments(collection, segmentIDs, vecFieldIDs) if len(indexed) > 0 { indexedSet := typeutil.NewUniqueSet(indexed...) for _, segment := range segmentList { if !isFlushState(segment.GetState()) && segment.GetState() != commonpb.SegmentState_Dropped { continue } if indexedSet.Contain(segment.GetID()) { ret = append(ret, segment) } } } } return ret } func getZeroTime() time.Time { var t time.Time return t } // getCollectionTTL returns ttl if collection's ttl is specified, or return global ttl func getCollectionTTL(properties map[string]string) (time.Duration, error) { v, ok := properties[common.CollectionTTLConfigKey] if ok { ttl, err := strconv.Atoi(v) if err != nil { return -1, err } return time.Duration(ttl) * time.Second, nil } return Params.CommonCfg.EntityExpirationTTL.GetAsDuration(time.Second), nil } func UpdateCompactionSegmentSizeMetrics(segments []*datapb.CompactionSegment) { var totalSize int64 for _, seg := range segments { totalSize += getCompactedSegmentSize(seg) } // observe size in bytes metrics.DataCoordCompactedSegmentSize.WithLabelValues().Observe(float64(totalSize)) } func getCompactedSegmentSize(s *datapb.CompactionSegment) int64 { var segmentSize int64 if s != nil { for _, binlogs := range s.GetInsertLogs() { for _, l := range binlogs.GetBinlogs() { segmentSize += l.GetMemorySize() } } for _, deltaLogs := range s.GetDeltalogs() { for _, l := range deltaLogs.GetBinlogs() { segmentSize += l.GetMemorySize() } } for _, statsLogs := range s.GetField2StatslogPaths() { for _, l := range statsLogs.GetBinlogs() { segmentSize += l.GetMemorySize() } } } return segmentSize } // getCollectionAutoCompactionEnabled returns whether auto compaction for collection is enabled. // if not set, returns global auto compaction config. func getCollectionAutoCompactionEnabled(properties map[string]string) (bool, error) { v, ok := properties[common.CollectionAutoCompactionKey] if ok { enabled, err := strconv.ParseBool(v) if err != nil { return false, err } return enabled, nil } return Params.DataCoordCfg.EnableAutoCompaction.GetAsBool(), nil } func GetIndexType(indexParams []*commonpb.KeyValuePair) string { for _, param := range indexParams { if param.Key == common.IndexTypeKey { return param.Value } } return invalidIndex } func isFlatIndex(indexType string) bool { return indexType == indexparamcheck.IndexFaissIDMap || indexType == indexparamcheck.IndexFaissBinIDMap } func isDiskANNIndex(indexType string) bool { return indexType == indexparamcheck.IndexDISKANN } func parseBuildIDFromFilePath(key string) (UniqueID, error) { ss := strings.Split(key, "/") if strings.HasSuffix(key, "/") { return strconv.ParseInt(ss[len(ss)-2], 10, 64) } return strconv.ParseInt(ss[len(ss)-1], 10, 64) } func getFieldBinlogs(id UniqueID, binlogs []*datapb.FieldBinlog) *datapb.FieldBinlog { for _, binlog := range binlogs { if id == binlog.GetFieldID() { return binlog } } return nil } func mergeFieldBinlogs(currentBinlogs []*datapb.FieldBinlog, newBinlogs []*datapb.FieldBinlog) []*datapb.FieldBinlog { for _, newBinlog := range newBinlogs { fieldBinlogs := getFieldBinlogs(newBinlog.GetFieldID(), currentBinlogs) if fieldBinlogs == nil { currentBinlogs = append(currentBinlogs, newBinlog) } else { fieldBinlogs.Binlogs = append(fieldBinlogs.Binlogs, newBinlog.Binlogs...) } } return currentBinlogs } func calculateL0SegmentSize(fields []*datapb.FieldBinlog) float64 { size := int64(0) for _, field := range fields { for _, binlog := range field.GetBinlogs() { size += binlog.GetMemorySize() } } return float64(size) }