milvus/internal/indexcoord/meta_table.go

1107 lines
34 KiB
Go
Raw Normal View History

// Licensed to the LF AI & Data foundation under one
// or more contributor license agreements. See the NOTICE file
// distributed with this work for additional information
// regarding copyright ownership. The ASF licenses this file
// to you under the Apache License, Version 2.0 (the
// "License"); you may not use this file except in compliance
// with the License. You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
2021-06-21 17:28:03 +08:00
package indexcoord
import (
"context"
"errors"
"fmt"
"strconv"
"sync"
"github.com/milvus-io/milvus/internal/util/timerecord"
"github.com/prometheus/client_golang/prometheus"
"github.com/golang/protobuf/proto"
"go.uber.org/zap"
"github.com/milvus-io/milvus-proto/go-api/commonpb"
"github.com/milvus-io/milvus/internal/common"
"github.com/milvus-io/milvus/internal/kv"
"github.com/milvus-io/milvus/internal/log"
"github.com/milvus-io/milvus/internal/metastore"
"github.com/milvus-io/milvus/internal/metastore/kv/indexcoord"
"github.com/milvus-io/milvus/internal/metastore/model"
"github.com/milvus-io/milvus/internal/metrics"
"github.com/milvus-io/milvus/internal/proto/indexpb"
)
// metaTable maintains index-related information
type metaTable struct {
catalog metastore.IndexCoordCatalog
indexLock sync.RWMutex
segmentIndexLock sync.RWMutex
// collectionIndexes records which indexes are on the collection
// collID -> indexID -> index
collectionIndexes map[UniqueID]map[UniqueID]*model.Index
// segmentIndexes records which indexes are on the segment
// segID -> indexID -> segmentIndex
segmentIndexes map[UniqueID]map[UniqueID]*model.SegmentIndex
// buildID2Meta records the meta information of the segment
// buildID -> segmentIndex
buildID2SegmentIndex map[UniqueID]*model.SegmentIndex
}
// NewMetaTable is used to create a new meta table.
func NewMetaTable(kv kv.MetaKv) (*metaTable, error) {
mt := &metaTable{
catalog: &indexcoord.Catalog{
Txn: kv,
},
indexLock: sync.RWMutex{},
segmentIndexLock: sync.RWMutex{},
}
err := mt.reloadFromKV()
if err != nil {
return nil, err
}
return mt, nil
}
func (mt *metaTable) updateCollectionIndex(index *model.Index) {
if _, ok := mt.collectionIndexes[index.CollectionID]; !ok {
mt.collectionIndexes[index.CollectionID] = make(map[UniqueID]*model.Index)
}
mt.collectionIndexes[index.CollectionID][index.IndexID] = index
}
func (mt *metaTable) updateSegmentIndex(segIdx *model.SegmentIndex) {
if _, ok := mt.segmentIndexes[segIdx.SegmentID]; !ok {
mt.segmentIndexes[segIdx.SegmentID] = make(map[UniqueID]*model.SegmentIndex)
}
mt.segmentIndexes[segIdx.SegmentID][segIdx.IndexID] = segIdx
mt.buildID2SegmentIndex[segIdx.BuildID] = segIdx
}
// reloadFromKV reloads the index meta from ETCD.
func (mt *metaTable) reloadFromKV() error {
record := timerecord.NewTimeRecorder("indexcoord")
mt.collectionIndexes = make(map[UniqueID]map[UniqueID]*model.Index)
mt.segmentIndexes = make(map[UniqueID]map[UniqueID]*model.SegmentIndex)
mt.buildID2SegmentIndex = make(map[UniqueID]*model.SegmentIndex)
// load field indexes
log.Info("IndexCoord metaTable reloadFromKV load indexes")
fieldIndexes, err := mt.catalog.ListIndexes(context.Background())
if err != nil {
log.Error("IndexCoord metaTable reloadFromKV load field indexes fail", zap.Error(err))
return err
}
segmentIndxes, err := mt.catalog.ListSegmentIndexes(context.Background())
if err != nil {
log.Error("IndexCoord metaTable reloadFromKV load segment indexes fail", zap.Error(err))
return err
}
for _, fieldIndex := range fieldIndexes {
mt.updateCollectionIndex(fieldIndex)
}
for _, segIdx := range segmentIndxes {
mt.updateSegmentIndex(segIdx)
}
log.Info("IndexCoord metaTable reloadFromKV success")
record.Record("metaTable reloadFromKV")
return nil
}
func (mt *metaTable) saveFieldIndexMeta(index *model.Index) error {
err := mt.catalog.CreateIndex(context.Background(), index)
if err != nil {
log.Error("failed to save index meta in etcd", zap.Int64("buildID", index.CollectionID),
zap.Int64("fieldID", index.FieldID), zap.Int64("indexID", index.IndexID), zap.Error(err))
return err
}
mt.updateCollectionIndex(index)
return nil
}
func (mt *metaTable) alterIndexes(indexes []*model.Index) error {
err := mt.catalog.AlterIndexes(context.Background(), indexes)
if err != nil {
log.Error("failed to alter index meta in meta store", zap.Int("indexes num", len(indexes)), zap.Error(err))
return err
}
for _, index := range indexes {
mt.updateCollectionIndex(index)
}
return nil
}
func (mt *metaTable) alterSegmentIndexes(segIdxes []*model.SegmentIndex) error {
err := mt.catalog.AlterSegmentIndexes(context.Background(), segIdxes)
if err != nil {
log.Error("failed to alter segments index in meta store", zap.Int("segment indexes num", len(segIdxes)),
zap.Error(err))
return err
}
for _, segIdx := range segIdxes {
mt.updateSegmentIndex(segIdx)
}
return nil
}
// saveSegmentIndexMeta saves the index meta to ETCD.
// metaTable.lock.Lock() before call this function
func (mt *metaTable) saveSegmentIndexMeta(segIdx *model.SegmentIndex) error {
err := mt.catalog.CreateSegmentIndex(context.Background(), segIdx)
if err != nil {
log.Error("failed to save index meta in etcd", zap.Int64("buildID", segIdx.BuildID), zap.Error(err))
return err
}
mt.updateSegmentIndex(segIdx)
log.Info("IndexCoord metaTable saveIndexMeta success", zap.Int64("buildID", segIdx.BuildID))
return nil
}
func (mt *metaTable) updateIndexMeta(index *model.Index, updateFunc func(clonedIndex *model.Index) error) error {
return updateFunc(model.CloneIndex(index))
}
func (mt *metaTable) updateSegIndexMeta(segIdx *model.SegmentIndex, updateFunc func(clonedSegIdx *model.SegmentIndex) error) error {
return updateFunc(model.CloneSegmentIndex(segIdx))
}
func (mt *metaTable) updateIndexTasksMetrics() {
taskMetrics := make(map[UniqueID]map[commonpb.IndexState]int)
for _, segIdx := range mt.buildID2SegmentIndex {
if segIdx.IsDeleted {
continue
}
if _, ok := taskMetrics[segIdx.CollectionID]; !ok {
taskMetrics[segIdx.CollectionID] = make(map[commonpb.IndexState]int)
taskMetrics[segIdx.CollectionID][commonpb.IndexState_Unissued] = 0
taskMetrics[segIdx.CollectionID][commonpb.IndexState_InProgress] = 0
taskMetrics[segIdx.CollectionID][commonpb.IndexState_Finished] = 0
taskMetrics[segIdx.CollectionID][commonpb.IndexState_Failed] = 0
}
taskMetrics[segIdx.CollectionID][segIdx.IndexState]++
}
for collID, m := range taskMetrics {
for k, v := range m {
switch k {
case commonpb.IndexState_Unissued:
metrics.IndexCoordIndexTaskNum.WithLabelValues(strconv.FormatInt(collID, 10), metrics.UnissuedIndexTaskLabel).Set(float64(v))
case commonpb.IndexState_InProgress:
metrics.IndexCoordIndexTaskNum.WithLabelValues(strconv.FormatInt(collID, 10), metrics.InProgressIndexTaskLabel).Set(float64(v))
case commonpb.IndexState_Finished:
metrics.IndexCoordIndexTaskNum.WithLabelValues(strconv.FormatInt(collID, 10), metrics.FinishedIndexTaskLabel).Set(float64(v))
case commonpb.IndexState_Failed:
metrics.IndexCoordIndexTaskNum.WithLabelValues(strconv.FormatInt(collID, 10), metrics.FailedIndexTaskLabel).Set(float64(v))
}
}
}
}
func (mt *metaTable) GetAllIndexMeta() map[int64]*model.SegmentIndex {
mt.segmentIndexLock.RLock()
defer mt.segmentIndexLock.RUnlock()
metas := map[int64]*model.SegmentIndex{}
for buildID, segIdx := range mt.buildID2SegmentIndex {
metas[buildID] = model.CloneSegmentIndex(segIdx)
}
return metas
}
func (mt *metaTable) GetMeta(buildID UniqueID) (*model.SegmentIndex, bool) {
mt.segmentIndexLock.RLock()
defer mt.segmentIndexLock.RUnlock()
segIdx, ok := mt.buildID2SegmentIndex[buildID]
if ok && !segIdx.IsDeleted {
return model.CloneSegmentIndex(segIdx), true
}
return nil, false
}
func (mt *metaTable) GetTypeParams(collID, indexID UniqueID) []*commonpb.KeyValuePair {
mt.indexLock.RLock()
defer mt.indexLock.RUnlock()
fieldIndexes, ok := mt.collectionIndexes[collID]
if !ok {
return nil
}
index, ok := fieldIndexes[indexID]
if !ok {
return nil
}
typeParams := make([]*commonpb.KeyValuePair, len(index.TypeParams))
for i, param := range index.TypeParams {
typeParams[i] = proto.Clone(param).(*commonpb.KeyValuePair)
}
return typeParams
}
func (mt *metaTable) GetIndexParams(collID, indexID UniqueID) []*commonpb.KeyValuePair {
mt.indexLock.RLock()
defer mt.indexLock.RUnlock()
fieldIndexes, ok := mt.collectionIndexes[collID]
if !ok {
return nil
}
index, ok := fieldIndexes[indexID]
if !ok {
return nil
}
indexParams := make([]*commonpb.KeyValuePair, len(index.IndexParams))
for i, param := range index.IndexParams {
indexParams[i] = proto.Clone(param).(*commonpb.KeyValuePair)
}
return indexParams
}
func (mt *metaTable) CreateIndex(index *model.Index) error {
mt.indexLock.Lock()
defer mt.indexLock.Unlock()
log.Info("IndexCoord metaTable CreateIndex", zap.Int64("collectionID", index.CollectionID),
zap.Int64("fieldID", index.FieldID), zap.Int64("indexID", index.IndexID), zap.String("indexName", index.IndexName))
if err := mt.saveFieldIndexMeta(index); err != nil {
log.Error("IndexCoord metaTable CreateIndex save meta fail", zap.Int64("collectionID", index.CollectionID),
zap.Int64("fieldID", index.FieldID), zap.Int64("indexID", index.IndexID),
zap.String("indexName", index.IndexName), zap.Error(err))
return err
}
log.Info("IndexCoord metaTable CreateIndex success", zap.Int64("collectionID", index.CollectionID),
zap.Int64("fieldID", index.FieldID), zap.Int64("indexID", index.IndexID), zap.String("indexName", index.IndexName))
return nil
}
// AddIndex adds the index meta corresponding the indexBuildID to meta table.
func (mt *metaTable) AddIndex(segIndex *model.SegmentIndex) error {
mt.segmentIndexLock.Lock()
defer mt.segmentIndexLock.Unlock()
buildID := segIndex.BuildID
log.Info("IndexCoord metaTable AddIndex", zap.Int64("collID", segIndex.CollectionID),
zap.Int64("segID", segIndex.SegmentID), zap.Int64("indexID", segIndex.IndexID),
zap.Int64("buildID", buildID))
_, ok := mt.buildID2SegmentIndex[buildID]
if ok {
log.Info("index already exists", zap.Int64("buildID", buildID), zap.Int64("indexID", segIndex.IndexID))
return nil
}
segIndex.IndexState = commonpb.IndexState_Unissued
metrics.IndexCoordIndexTaskNum.WithLabelValues(strconv.FormatInt(segIndex.CollectionID, 10), metrics.UnissuedIndexTaskLabel).Inc()
if err := mt.saveSegmentIndexMeta(segIndex); err != nil {
// no need to reload, no reason to compare version fail
log.Error("IndexCoord metaTable save index meta failed", zap.Int64("buildID", buildID),
zap.Int64("indexID", segIndex.IndexID), zap.Error(err))
return err
}
log.Info("IndexCoord metaTable AddIndex success", zap.Int64("collID", segIndex.CollectionID),
zap.Int64("segID", segIndex.SegmentID), zap.Int64("indexID", segIndex.IndexID),
zap.Int64("buildID", buildID))
return nil
}
func (mt *metaTable) NeedIndex(collID, indexID UniqueID) bool {
mt.indexLock.RLock()
defer mt.indexLock.RUnlock()
fieldIndexes, ok := mt.collectionIndexes[collID]
if !ok {
return false
}
if index, ok := fieldIndexes[indexID]; !ok || index.IsDeleted {
return false
}
return true
}
func (mt *metaTable) canIndex(segIdx *model.SegmentIndex) bool {
if segIdx.IsDeleted {
log.Debug("Index has been deleted", zap.Int64("buildID", segIdx.BuildID))
return false
}
if segIdx.NodeID != 0 {
log.Debug("IndexCoord metaTable BuildIndex, but indexMeta's NodeID is not zero",
zap.Int64("buildID", segIdx.BuildID), zap.Int64("nodeID", segIdx.NodeID))
return false
}
if segIdx.IndexState != commonpb.IndexState_Unissued {
log.Debug("IndexCoord metaTable BuildIndex, but indexMeta's state is not unissued",
zap.Int64("buildID", segIdx.BuildID), zap.String("state", segIdx.IndexState.String()))
return false
}
return true
}
// UpdateVersion updates the version and nodeID of the index meta, whenever the task is built once, the version will be updated once.
func (mt *metaTable) UpdateVersion(buildID UniqueID, nodeID UniqueID) error {
mt.segmentIndexLock.Lock()
defer mt.segmentIndexLock.Unlock()
log.Debug("IndexCoord metaTable UpdateVersion receive", zap.Int64("buildID", buildID), zap.Int64("nodeID", nodeID))
segIdx, ok := mt.buildID2SegmentIndex[buildID]
if !ok {
return fmt.Errorf("there is no index with buildID: %d", buildID)
}
if !mt.canIndex(segIdx) {
return fmt.Errorf("it's no necessary to build index with buildID = %d", buildID)
}
updateFunc := func(segIdx *model.SegmentIndex) error {
segIdx.NodeID = nodeID
segIdx.IndexVersion++
return mt.alterSegmentIndexes([]*model.SegmentIndex{segIdx})
}
return mt.updateSegIndexMeta(segIdx, updateFunc)
}
// BuildIndex set the index state to be InProgress. It means IndexNode is building the index.
func (mt *metaTable) BuildIndex(buildID UniqueID) error {
mt.segmentIndexLock.Lock()
defer mt.segmentIndexLock.Unlock()
segIdx, ok := mt.buildID2SegmentIndex[buildID]
if !ok {
return fmt.Errorf("there is no index with buildID: %d", buildID)
}
updateFunc := func(segIdx *model.SegmentIndex) error {
if segIdx.IsDeleted {
errMsg := fmt.Sprintf("index has been marked deleted, no need to build index with ID: %d", segIdx.BuildID)
log.Warn(errMsg, zap.Int64("BuildID", segIdx.BuildID))
return errors.New(errMsg)
}
if segIdx.IndexState == commonpb.IndexState_Finished || segIdx.IndexState == commonpb.IndexState_Failed {
errMsg := fmt.Sprintf("index has been finished, no need to build index with ID: %d", segIdx.BuildID)
log.Warn(errMsg, zap.Int64("BuildID", segIdx.BuildID), zap.String("state", segIdx.IndexState.String()))
return errors.New(errMsg)
}
segIdx.IndexState = commonpb.IndexState_InProgress
err := mt.alterSegmentIndexes([]*model.SegmentIndex{segIdx})
if err != nil {
log.Error("IndexCoord metaTable BuildIndex fail", zap.Int64("buildID", segIdx.BuildID), zap.Error(err))
return err
}
return nil
}
if err := mt.updateSegIndexMeta(segIdx, updateFunc); err != nil {
return err
}
mt.updateIndexTasksMetrics()
return nil
}
// GetIndexesForCollection gets all indexes info with the specified collection.
func (mt *metaTable) GetIndexesForCollection(collID UniqueID, indexName string) []*model.Index {
mt.indexLock.RLock()
defer mt.indexLock.RUnlock()
indexInfos := make([]*model.Index, 0)
for _, index := range mt.collectionIndexes[collID] {
if index.IsDeleted {
continue
}
if indexName == "" || indexName == index.IndexName {
indexInfos = append(indexInfos, model.CloneIndex(index))
}
}
return indexInfos
}
func (mt *metaTable) CanCreateIndex(req *indexpb.CreateIndexRequest) (bool, error) {
mt.indexLock.RLock()
defer mt.indexLock.RUnlock()
indexes, ok := mt.collectionIndexes[req.CollectionID]
if !ok {
return true, nil
}
for _, index := range indexes {
if index.IsDeleted {
continue
}
if req.IndexName == index.IndexName {
if mt.checkParams(index, req) {
return true, nil
}
errMsg := "at most one distinct index is allowed per field"
log.Warn(errMsg,
zap.String("source index", fmt.Sprintf("{index_name: %s, field_id: %d, index_params: %v, type_params: %v}", index.IndexName, index.FieldID, index.IndexParams, index.TypeParams)),
zap.String("current index", fmt.Sprintf("{index_name: %s, field_id: %d, index_params: %v, type_params: %v}", req.GetIndexName(), req.GetFieldID(), req.GetIndexParams(), req.GetTypeParams())))
return false, fmt.Errorf("CreateIndex failed: %s", errMsg)
}
if req.FieldID == index.FieldID {
// creating multiple indexes on same field is not supported
return false, fmt.Errorf("CreateIndex failed: creating multiple indexes on same field is not supported")
}
}
return true, nil
}
func (mt *metaTable) checkParams(fieldIndex *model.Index, req *indexpb.CreateIndexRequest) bool {
if fieldIndex.IndexName != req.IndexName {
return false
}
if fieldIndex.FieldID != req.FieldID {
return false
}
if len(fieldIndex.TypeParams) != len(req.TypeParams) {
return false
}
notEq := false
for _, param1 := range fieldIndex.TypeParams {
exist := false
for _, param2 := range req.TypeParams {
if param2.Key == param1.Key && param2.Value == param1.Value {
exist = true
}
}
if !exist {
notEq = true
break
}
}
if notEq {
return false
}
if len(fieldIndex.IndexParams) != len(req.IndexParams) {
return false
}
for _, param1 := range fieldIndex.IndexParams {
exist := false
for _, param2 := range req.IndexParams {
if param2.Key == param1.Key && param2.Value == param1.Value {
exist = true
}
}
if !exist {
notEq = true
break
}
}
return !notEq
}
// HasSameReq determine whether there are same indexing tasks.
func (mt *metaTable) HasSameReq(req *indexpb.CreateIndexRequest) (bool, UniqueID) {
mt.indexLock.RLock()
defer mt.indexLock.RUnlock()
for _, fieldIndex := range mt.collectionIndexes[req.CollectionID] {
if fieldIndex.IsDeleted {
continue
}
if !mt.checkParams(fieldIndex, req) {
continue
}
log.Debug("IndexCoord has same index", zap.Int64("collectionID", req.CollectionID),
zap.Int64("fieldID", req.FieldID), zap.String("indexName", req.IndexName),
zap.Int64("indexID", fieldIndex.IndexID))
return true, fieldIndex.IndexID
}
return false, 0
}
func (mt *metaTable) HasSameIndex(segmentID, indexID UniqueID) (bool, UniqueID) {
mt.segmentIndexLock.RLock()
defer mt.segmentIndexLock.RUnlock()
if _, ok := mt.segmentIndexes[segmentID]; !ok {
return false, 0
}
if index, ok := mt.segmentIndexes[segmentID][indexID]; ok {
return true, index.BuildID
}
return false, 0
}
func (mt *metaTable) GetIndexIDByName(collID int64, indexName string) map[int64]uint64 {
mt.indexLock.RLock()
defer mt.indexLock.RUnlock()
indexID2CreateTs := make(map[int64]uint64)
fieldIndexes, ok := mt.collectionIndexes[collID]
if !ok {
return indexID2CreateTs
}
for _, index := range fieldIndexes {
if !index.IsDeleted && (indexName == "" || index.IndexName == indexName) {
indexID2CreateTs[index.IndexID] = index.CreateTime
}
}
return indexID2CreateTs
}
func (mt *metaTable) GetFieldIDByIndexID(collID, indexID UniqueID) UniqueID {
mt.indexLock.RLock()
defer mt.indexLock.RUnlock()
if fieldIndexes, ok := mt.collectionIndexes[collID]; ok {
if index, ok := fieldIndexes[indexID]; ok {
return index.FieldID
}
}
return 0
}
func (mt *metaTable) GetIndexNameByID(collID, indexID UniqueID) string {
mt.indexLock.RLock()
defer mt.indexLock.RUnlock()
if fieldIndexes, ok := mt.collectionIndexes[collID]; ok {
if index, ok := fieldIndexes[indexID]; ok {
return index.IndexName
}
}
return ""
}
type IndexState struct {
state commonpb.IndexState
failReason string
}
type IndexStateCnt struct {
None int
Unissued int
InProgress int
Finished int
Failed int
FailReason string
}
// GetIndexStates gets the index states for indexID from meta table.
func (mt *metaTable) GetIndexStates(indexID int64, createTs uint64) ([]*IndexState, IndexStateCnt) {
mt.segmentIndexLock.RLock()
defer mt.segmentIndexLock.RUnlock()
segIndexStates := make([]*IndexState, 0)
var (
cntNone = 0
cntUnissued = 0
cntInProgress = 0
cntFinished = 0
cntFailed = 0
failReason string
)
for _, indexID2SegIdx := range mt.segmentIndexes {
segIdx, ok := indexID2SegIdx[indexID]
if !ok {
continue
}
if segIdx.CreateTime > createTs {
continue
}
if segIdx.IsDeleted {
// skip deleted index, deleted by compaction
continue
}
switch segIdx.IndexState {
case commonpb.IndexState_IndexStateNone:
cntNone++
case commonpb.IndexState_Unissued:
cntUnissued++
case commonpb.IndexState_InProgress:
cntInProgress++
case commonpb.IndexState_Finished:
cntFinished++
case commonpb.IndexState_Failed:
cntFailed++
failReason += fmt.Sprintf("%d: %s;", segIdx.SegmentID, segIdx.FailReason)
}
segIndexStates = append(segIndexStates, &IndexState{
state: segIdx.IndexState,
failReason: segIdx.FailReason,
})
}
log.Debug("IndexCoord get index states success", zap.Int64("indexID", indexID),
zap.Int("total", len(segIndexStates)), zap.Int("None", cntNone), zap.Int("Unissued", cntUnissued),
zap.Int("InProgress", cntInProgress), zap.Int("Finished", cntFinished), zap.Int("Failed", cntFailed))
return segIndexStates, IndexStateCnt{
None: cntNone,
Unissued: cntNone,
InProgress: cntInProgress,
Finished: cntFinished,
Failed: cntFailed,
FailReason: failReason,
}
}
func (mt *metaTable) GetSegmentIndexes(segID UniqueID) []*model.SegmentIndex {
mt.segmentIndexLock.RLock()
defer mt.segmentIndexLock.RUnlock()
segIndexInfos := make([]*model.SegmentIndex, 0)
if segIndexes, ok := mt.segmentIndexes[segID]; ok {
for _, segIdx := range segIndexes {
if segIdx.IsDeleted {
continue
}
segIndexInfos = append(segIndexInfos, model.CloneSegmentIndex(segIdx))
}
}
return segIndexInfos
}
func (mt *metaTable) GetSegmentIndexState(segmentID UniqueID) IndexState {
mt.segmentIndexLock.RLock()
defer mt.segmentIndexLock.RUnlock()
state := IndexState{
state: commonpb.IndexState_Finished,
failReason: "",
}
if segIdxes, ok := mt.segmentIndexes[segmentID]; ok {
for _, segIdx := range segIdxes {
if segIdx.IsDeleted {
continue
}
if segIdx.IndexState != commonpb.IndexState_Finished {
state.state = segIdx.IndexState
state.failReason = segIdx.FailReason
}
}
}
return state
}
// GetIndexBuildProgress gets the index progress for indexID from meta table.
func (mt *metaTable) GetIndexBuildProgress(indexID int64, segIDs []UniqueID) int64 {
mt.segmentIndexLock.RLock()
defer mt.segmentIndexLock.RUnlock()
indexRows := int64(0)
for _, segID := range segIDs {
segIndexes, ok := mt.segmentIndexes[segID]
if !ok {
continue
}
if segIdx, ok2 := segIndexes[indexID]; ok2 {
if segIdx.IsDeleted {
// partition is dropped, but DataCoord has not received the message
continue
}
// flat index, small segment
if segIdx.IndexState == commonpb.IndexState_Finished {
indexRows += segIdx.NumRows
}
}
}
log.Debug("IndexCoord get index states success", zap.Int64("indexID", indexID),
zap.Int64("indexRows", indexRows))
return indexRows
}
// MarkIndexAsDeleted will mark the corresponding index as deleted, and recycleUnusedIndexFiles will recycle these tasks.
func (mt *metaTable) MarkIndexAsDeleted(collID UniqueID, indexIDs []UniqueID) error {
log.Info("IndexCoord metaTable MarkIndexAsDeleted", zap.Int64("collID", collID),
zap.Int64s("indexIDs", indexIDs))
mt.indexLock.Lock()
defer mt.indexLock.Unlock()
fieldIndexes, ok := mt.collectionIndexes[collID]
if !ok {
return nil
}
indexes := make([]*model.Index, 0)
for _, indexID := range indexIDs {
index, ok := fieldIndexes[indexID]
if !ok || index.IsDeleted {
continue
}
clonedIndex := model.CloneIndex(index)
clonedIndex.IsDeleted = true
indexes = append(indexes, clonedIndex)
}
if len(indexes) == 0 {
return nil
}
err := mt.alterIndexes(indexes)
if err != nil {
log.Error("IndexCoord metaTable MarkIndexAsDeleted fail", zap.Int64("collID", collID),
zap.Int64s("indexIDs", indexIDs), zap.Error(err))
return err
}
log.Info("IndexCoord metaTable MarkIndexAsDeleted success", zap.Int64("collID", collID), zap.Int64s("indexIDs", indexIDs))
return nil
}
// MarkSegmentsIndexAsDeleted will mark the index on the segment corresponding the buildID as deleted, and recycleUnusedSegIndexes will recycle these tasks.
func (mt *metaTable) MarkSegmentsIndexAsDeleted(selector func(index *model.SegmentIndex) bool) error {
mt.segmentIndexLock.Lock()
defer mt.segmentIndexLock.Unlock()
buildIDs := make([]UniqueID, 0)
segIdxes := make([]*model.SegmentIndex, 0)
for _, segIdx := range mt.buildID2SegmentIndex {
if segIdx.IsDeleted {
continue
}
if selector(segIdx) {
clonedSegIdx := model.CloneSegmentIndex(segIdx)
clonedSegIdx.IsDeleted = true
segIdxes = append(segIdxes, clonedSegIdx)
buildIDs = append(buildIDs, segIdx.BuildID)
}
}
if len(segIdxes) == 0 {
log.Debug("IndexCoord metaTable MarkSegmentsIndexAsDeleted success, no segment index need to mark")
return nil
}
err := mt.alterSegmentIndexes(segIdxes)
if err != nil {
return err
}
return nil
}
func (mt *metaTable) GetSegmentIndexByBuildID(buildID UniqueID) (bool, *model.SegmentIndex) {
mt.segmentIndexLock.RLock()
defer mt.segmentIndexLock.RUnlock()
log.Debug("IndexCoord get index file path from meta table", zap.Int64("buildID", buildID))
segIdx, ok := mt.buildID2SegmentIndex[buildID]
if !ok || segIdx.IsDeleted {
return false, nil
}
if segIdx.IndexState != commonpb.IndexState_Finished && segIdx.IndexState != commonpb.IndexState_Failed {
return false, nil
}
log.Debug("IndexCoord get segment index file path success", zap.Int64("buildID", buildID),
zap.Int("index files num", len(segIdx.IndexFileKeys)))
return true, segIdx
}
func (mt *metaTable) IsIndexDeleted(collID, indexID UniqueID) bool {
mt.indexLock.RLock()
defer mt.indexLock.RUnlock()
fieldIndexes, ok := mt.collectionIndexes[collID]
if !ok {
return true
}
if index, ok := fieldIndexes[indexID]; !ok || index.IsDeleted {
return true
}
return false
}
func (mt *metaTable) IsSegIndexDeleted(buildID UniqueID) bool {
mt.segmentIndexLock.RLock()
defer mt.segmentIndexLock.RUnlock()
if segIdx, ok := mt.buildID2SegmentIndex[buildID]; !ok || segIdx.IsDeleted {
return true
}
return false
}
func (mt *metaTable) GetMetasByNodeID(nodeID UniqueID) []*model.SegmentIndex {
mt.segmentIndexLock.RLock()
defer mt.segmentIndexLock.RUnlock()
metas := make([]*model.SegmentIndex, 0)
for _, meta := range mt.buildID2SegmentIndex {
if meta.IsDeleted {
continue
}
if nodeID == meta.NodeID {
metas = append(metas, model.CloneSegmentIndex(meta))
}
}
return metas
}
func (mt *metaTable) GetAllSegIndexes() map[int64]*model.SegmentIndex {
mt.segmentIndexLock.RLock()
defer mt.segmentIndexLock.RUnlock()
segIndexes := make(map[int64]*model.SegmentIndex)
for _, meta := range mt.buildID2SegmentIndex {
segIndexes[meta.SegmentID] = model.CloneSegmentIndex(meta)
}
return segIndexes
}
func (mt *metaTable) GetDeletedIndexes() []*model.Index {
mt.indexLock.RLock()
defer mt.indexLock.RUnlock()
var indexes []*model.Index
for _, fieldIndexes := range mt.collectionIndexes {
for _, index := range fieldIndexes {
if index.IsDeleted {
indexes = append(indexes, model.CloneIndex(index))
}
}
}
return indexes
}
func (mt *metaTable) GetDeletedSegmentIndexes() []*model.SegmentIndex {
mt.segmentIndexLock.RLock()
defer mt.segmentIndexLock.RUnlock()
segIndexes := make([]*model.SegmentIndex, 0)
for _, segIdx := range mt.buildID2SegmentIndex {
if segIdx.IsDeleted {
segIndexes = append(segIndexes, segIdx)
}
}
return segIndexes
}
func (mt *metaTable) GetBuildIDsFromIndexID(indexID UniqueID) []UniqueID {
mt.segmentIndexLock.RLock()
defer mt.segmentIndexLock.RUnlock()
buildIDs := make([]UniqueID, 0)
for buildID, segIdx := range mt.buildID2SegmentIndex {
if segIdx.IndexID == indexID {
buildIDs = append(buildIDs, buildID)
}
}
return buildIDs
}
func (mt *metaTable) GetBuildIDsFromSegIDs(segIDs []UniqueID) []UniqueID {
mt.segmentIndexLock.RLock()
defer mt.segmentIndexLock.RUnlock()
buildIDs := make([]UniqueID, 0)
for _, segID := range segIDs {
if segIdxes, ok := mt.segmentIndexes[segID]; ok {
for _, segIdx := range segIdxes {
buildIDs = append(buildIDs, segIdx.BuildID)
}
}
}
return buildIDs
}
// RemoveIndex remove the index on the collection from meta table.
func (mt *metaTable) RemoveIndex(collID, indexID UniqueID) error {
mt.indexLock.Lock()
defer mt.indexLock.Unlock()
log.Info("IndexCoord meta table remove index", zap.Int64("collID", collID), zap.Int64("indexID", indexID))
err := mt.catalog.DropIndex(context.Background(), collID, indexID)
if err != nil {
log.Info("IndexCoord meta table remove index fail", zap.Int64("collID", collID),
zap.Int64("indexID", indexID), zap.Error(err))
return err
}
delete(mt.collectionIndexes[collID], indexID)
if len(mt.collectionIndexes[collID]) == 0 {
delete(mt.collectionIndexes, collID)
metrics.IndexCoordIndexTaskNum.Delete(prometheus.Labels{"collection_id": strconv.FormatInt(collID, 10), "index_task_status": metrics.UnissuedIndexTaskLabel})
metrics.IndexCoordIndexTaskNum.Delete(prometheus.Labels{"collection_id": strconv.FormatInt(collID, 10), "index_task_status": metrics.InProgressIndexTaskLabel})
metrics.IndexCoordIndexTaskNum.Delete(prometheus.Labels{"collection_id": strconv.FormatInt(collID, 10), "index_task_status": metrics.FinishedIndexTaskLabel})
metrics.IndexCoordIndexTaskNum.Delete(prometheus.Labels{"collection_id": strconv.FormatInt(collID, 10), "index_task_status": metrics.FailedIndexTaskLabel})
}
log.Info("IndexCoord meta table remove index success", zap.Int64("collID", collID), zap.Int64("indexID", indexID))
return nil
}
// RemoveSegmentIndex remove the index on the segment from meta table.
func (mt *metaTable) RemoveSegmentIndex(collID, partID, segID, buildID UniqueID) error {
mt.segmentIndexLock.Lock()
defer mt.segmentIndexLock.Unlock()
err := mt.catalog.DropSegmentIndex(context.Background(), collID, partID, segID, buildID)
if err != nil {
return err
}
segIdx, ok := mt.buildID2SegmentIndex[buildID]
if !ok {
return nil
}
delete(mt.segmentIndexes[segID], segIdx.IndexID)
delete(mt.buildID2SegmentIndex, buildID)
if len(mt.segmentIndexes[segID]) == 0 {
delete(mt.segmentIndexes, segID)
}
return nil
}
// HasBuildID checks if there is an index corresponding the buildID in the meta table.
func (mt *metaTable) HasBuildID(buildID UniqueID) bool {
mt.segmentIndexLock.RLock()
defer mt.segmentIndexLock.RUnlock()
_, ok := mt.buildID2SegmentIndex[buildID]
return ok
}
// ResetNodeID resets the nodeID of the index meta corresponding the buildID.
func (mt *metaTable) ResetNodeID(buildID UniqueID) error {
mt.segmentIndexLock.Lock()
defer mt.segmentIndexLock.Unlock()
updateFunc := func(segIdx *model.SegmentIndex) error {
segIdx.NodeID = 0
return mt.alterSegmentIndexes([]*model.SegmentIndex{segIdx})
}
segIdx, ok := mt.buildID2SegmentIndex[buildID]
if !ok {
return fmt.Errorf("there is no index with buildID: %d", buildID)
}
return mt.updateSegIndexMeta(segIdx, updateFunc)
}
// ResetMeta resets the nodeID and index state of the index meta corresponding the buildID.
func (mt *metaTable) ResetMeta(buildID UniqueID) error {
mt.segmentIndexLock.Lock()
defer mt.segmentIndexLock.Unlock()
segIdx, ok := mt.buildID2SegmentIndex[buildID]
if !ok {
return fmt.Errorf("there is no index with buildID: %d", buildID)
}
updateFunc := func(segIdx *model.SegmentIndex) error {
segIdx.NodeID = 0
segIdx.IndexState = commonpb.IndexState_Unissued
return mt.alterSegmentIndexes([]*model.SegmentIndex{segIdx})
}
if err := mt.updateSegIndexMeta(segIdx, updateFunc); err != nil {
return err
}
mt.updateIndexTasksMetrics()
return nil
}
func (mt *metaTable) FinishTask(taskInfo *indexpb.IndexTaskInfo) error {
mt.segmentIndexLock.Lock()
defer mt.segmentIndexLock.Unlock()
segIdx, ok := mt.buildID2SegmentIndex[taskInfo.BuildID]
if !ok || segIdx.IsDeleted {
return fmt.Errorf("there is no index with buildID: %d", taskInfo.BuildID)
}
updateFunc := func(segIdx *model.SegmentIndex) error {
segIdx.IndexState = taskInfo.State
segIdx.IndexFileKeys = common.CloneStringList(taskInfo.IndexFileKeys)
segIdx.FailReason = taskInfo.FailReason
segIdx.IndexSize = taskInfo.SerializedSize
return mt.alterSegmentIndexes([]*model.SegmentIndex{segIdx})
}
if err := mt.updateSegIndexMeta(segIdx, updateFunc); err != nil {
return err
}
mt.updateIndexTasksMetrics()
log.Info("finish index task success", zap.Int64("buildID", taskInfo.BuildID),
zap.String("state", taskInfo.GetState().String()), zap.String("fail reason", taskInfo.GetFailReason()))
return nil
}
func (mt *metaTable) MarkSegmentsIndexAsDeletedByBuildID(buildIDs []UniqueID) error {
mt.segmentIndexLock.Lock()
defer mt.segmentIndexLock.Unlock()
segIdxes := make([]*model.SegmentIndex, 0)
for _, buildID := range buildIDs {
if segIdx, ok := mt.buildID2SegmentIndex[buildID]; ok {
if segIdx.IsDeleted {
continue
}
clonedSegIdx := model.CloneSegmentIndex(segIdx)
clonedSegIdx.IsDeleted = true
segIdxes = append(segIdxes, clonedSegIdx)
}
}
if len(segIdxes) == 0 {
log.Debug("IndexCoord metaTable MarkSegmentsIndexAsDeletedByBuildID success, already have deleted",
zap.Int64s("buildIDs", buildIDs))
return nil
}
err := mt.alterSegmentIndexes(segIdxes)
if err != nil {
log.Error("IndexCoord metaTable MarkSegmentsIndexAsDeletedByBuildID fail", zap.Int64s("buildIDs", buildIDs), zap.Error(err))
return err
}
log.Info("IndexCoord metaTable MarkSegmentsIndexAsDeletedByBuildID success", zap.Int64s("buildIDs", buildIDs))
return nil
}
func (mt *metaTable) MarkSegmentWriteHandoff(segID UniqueID) error {
mt.segmentIndexLock.Lock()
defer mt.segmentIndexLock.Unlock()
segIdxes := make([]*model.SegmentIndex, 0)
if segIndexes, ok := mt.segmentIndexes[segID]; ok {
for _, segIdx := range segIndexes {
clonedSegIdx := model.CloneSegmentIndex(segIdx)
clonedSegIdx.WriteHandoff = true
segIdxes = append(segIdxes, clonedSegIdx)
}
}
return mt.alterSegmentIndexes(segIdxes)
}
func (mt *metaTable) AlreadyWrittenHandoff(segID UniqueID) bool {
mt.segmentIndexLock.RLock()
defer mt.segmentIndexLock.RUnlock()
if segIndexes, ok := mt.segmentIndexes[segID]; ok {
for _, segIdx := range segIndexes {
if !segIdx.WriteHandoff {
return false
}
}
}
return true
}