mirror of
https://gitee.com/milvus-io/milvus.git
synced 2024-12-02 11:59:00 +08:00
2512dff261
Signed-off-by: cai.zhang <cai.zhang@zilliz.com>
604 lines
19 KiB
Go
604 lines
19 KiB
Go
// Licensed to the LF AI & Data foundation under one
|
|
// or more contributor license agreements. See the NOTICE file
|
|
// distributed with this work for additional information
|
|
// regarding copyright ownership. The ASF licenses this file
|
|
// to you under the Apache License, Version 2.0 (the
|
|
// "License"); you may not use this file except in compliance
|
|
// with the License. You may obtain a copy of the License at
|
|
//
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
//
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
// See the License for the specific language governing permissions and
|
|
// limitations under the License.
|
|
|
|
package indexnode
|
|
|
|
import (
|
|
"context"
|
|
"errors"
|
|
"fmt"
|
|
"path"
|
|
"runtime"
|
|
"runtime/debug"
|
|
"strconv"
|
|
|
|
"github.com/milvus-io/milvus/internal/metrics"
|
|
|
|
"go.uber.org/zap"
|
|
|
|
"github.com/golang/protobuf/proto"
|
|
"github.com/milvus-io/milvus/internal/kv"
|
|
etcdkv "github.com/milvus-io/milvus/internal/kv/etcd"
|
|
"github.com/milvus-io/milvus/internal/log"
|
|
"github.com/milvus-io/milvus/internal/proto/commonpb"
|
|
"github.com/milvus-io/milvus/internal/proto/indexpb"
|
|
"github.com/milvus-io/milvus/internal/storage"
|
|
"github.com/milvus-io/milvus/internal/util/funcutil"
|
|
"github.com/milvus-io/milvus/internal/util/retry"
|
|
"github.com/milvus-io/milvus/internal/util/timerecord"
|
|
"github.com/milvus-io/milvus/internal/util/trace"
|
|
)
|
|
|
|
const (
|
|
// paramsKeyToParse is the key of the param to build index.
|
|
paramsKeyToParse = "params"
|
|
|
|
// IndexBuildTaskName is the name of the operation to add an index task.
|
|
IndexBuildTaskName = "IndexBuildTask"
|
|
)
|
|
|
|
type task interface {
|
|
Ctx() context.Context
|
|
ID() UniqueID // return ReqID
|
|
Name() string
|
|
SetID(uid UniqueID) // set ReqID
|
|
PreExecute(ctx context.Context) error
|
|
Execute(ctx context.Context) error
|
|
PostExecute(ctx context.Context) error
|
|
WaitToFinish() error
|
|
Notify(err error)
|
|
OnEnqueue() error
|
|
SetError(err error)
|
|
SetState(state TaskState)
|
|
GetState() TaskState
|
|
}
|
|
|
|
// BaseTask is an basic instance of task.
|
|
type BaseTask struct {
|
|
done chan error
|
|
ctx context.Context
|
|
id UniqueID
|
|
err error
|
|
internalErr error
|
|
state TaskState
|
|
}
|
|
|
|
// SetState sets task's state.
|
|
func (bt *BaseTask) SetState(state TaskState) {
|
|
bt.state = state
|
|
}
|
|
|
|
// GetState gets task's state.
|
|
func (bt *BaseTask) GetState() TaskState {
|
|
return bt.state
|
|
}
|
|
|
|
// SetError sets an error to task.
|
|
func (bt *BaseTask) SetError(err error) {
|
|
bt.err = err
|
|
}
|
|
|
|
// ID returns the id of index task.
|
|
func (bt *BaseTask) ID() UniqueID {
|
|
return bt.id
|
|
}
|
|
|
|
// setID set the ID for the task.
|
|
func (bt *BaseTask) setID(id UniqueID) {
|
|
bt.id = id
|
|
}
|
|
|
|
// WaitToFinish will wait for the task to complete, if the context is done, it means that the execution of the task has timed out.
|
|
func (bt *BaseTask) WaitToFinish() error {
|
|
select {
|
|
case <-bt.ctx.Done():
|
|
return errors.New("timeout")
|
|
case err := <-bt.done:
|
|
return err
|
|
}
|
|
}
|
|
|
|
// Notify will notify WaitToFinish that the task is completed or failed.
|
|
func (bt *BaseTask) Notify(err error) {
|
|
bt.done <- err
|
|
}
|
|
|
|
// IndexBuildTask is used to record the information of the index tasks.
|
|
type IndexBuildTask struct {
|
|
BaseTask
|
|
index Index
|
|
kv kv.BaseKV
|
|
etcdKV *etcdkv.EtcdKV
|
|
savePaths []string
|
|
req *indexpb.CreateIndexRequest
|
|
nodeID UniqueID
|
|
serializedSize uint64
|
|
collectionID UniqueID
|
|
partitionID UniqueID
|
|
segmentID UniqueID
|
|
newTypeParams map[string]string
|
|
newIndexParams map[string]string
|
|
tr *timerecord.TimeRecorder
|
|
}
|
|
|
|
// Ctx is the context of index tasks.
|
|
func (it *IndexBuildTask) Ctx() context.Context {
|
|
return it.ctx
|
|
}
|
|
|
|
// ID returns the id of index task.
|
|
func (it *IndexBuildTask) ID() UniqueID {
|
|
return it.id
|
|
}
|
|
|
|
// SetID sets the id for index task.
|
|
func (it *IndexBuildTask) SetID(ID UniqueID) {
|
|
it.BaseTask.setID(ID)
|
|
}
|
|
|
|
// Name is the name of task to build index.
|
|
func (bt *BaseTask) Name() string {
|
|
return IndexBuildTaskName
|
|
}
|
|
|
|
// OnEnqueue enqueues indexing tasks.
|
|
func (it *IndexBuildTask) OnEnqueue() error {
|
|
it.SetID(it.req.IndexBuildID)
|
|
it.SetState(TaskStateNormal)
|
|
log.Debug("IndexNode IndexBuilderTask Enqueue", zap.Int64("taskID", it.ID()), zap.Int64("index buildID", it.req.IndexBuildID))
|
|
it.tr = timerecord.NewTimeRecorder(fmt.Sprintf("IndexBuildTask %d", it.req.IndexBuildID))
|
|
return nil
|
|
}
|
|
|
|
// loadIndexMeta load meta from etcd.
|
|
func (it *IndexBuildTask) loadIndexMeta(ctx context.Context) (*indexpb.IndexMeta, int64, error) {
|
|
indexMeta := indexpb.IndexMeta{}
|
|
var source int64
|
|
fn := func() error {
|
|
//TODO error handling need to be optimized, return Unrecoverable to avoid retry
|
|
_, values, versions, err := it.etcdKV.LoadWithPrefix2(it.req.MetaPath)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
if len(values) == 0 {
|
|
return fmt.Errorf("IndexNode loadIndexMeta get empty")
|
|
}
|
|
err = proto.Unmarshal([]byte(values[0]), &indexMeta)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
source = versions[0]
|
|
return nil
|
|
}
|
|
err := retry.Do(ctx, fn, retry.Attempts(3))
|
|
if err != nil {
|
|
return nil, -1, err
|
|
}
|
|
return &indexMeta, source, nil
|
|
}
|
|
|
|
func (it *IndexBuildTask) updateTaskState(indexMeta *indexpb.IndexMeta) TaskState {
|
|
if indexMeta.Version > it.req.Version || indexMeta.State == commonpb.IndexState_Finished {
|
|
it.SetState(TaskStateAbandon)
|
|
} else if indexMeta.MarkDeleted {
|
|
it.SetState(TaskStateAbandon)
|
|
}
|
|
return it.GetState()
|
|
}
|
|
|
|
// saveIndexMeta try to save index meta to metaKV.
|
|
// if failed, IndexNode will panic to inform indexcoord.
|
|
func (it *IndexBuildTask) saveIndexMeta(ctx context.Context) error {
|
|
defer it.tr.Record("IndexNode IndexBuildTask saveIndexMeta")
|
|
|
|
fn := func() error {
|
|
indexMeta, version, err := it.loadIndexMeta(ctx)
|
|
if err != nil {
|
|
errMsg := fmt.Sprintf("IndexNode IndexBuildTask saveIndexMeta fail to load index meta, IndexBuildID=%d", indexMeta.IndexBuildID)
|
|
panic(errMsg)
|
|
}
|
|
|
|
taskState := it.updateTaskState(indexMeta)
|
|
if taskState == TaskStateAbandon {
|
|
log.Info("IndexNode IndexBuildTask saveIndexMeta", zap.String("TaskState", taskState.String()),
|
|
zap.Int64("IndexBuildID", indexMeta.IndexBuildID))
|
|
return nil
|
|
}
|
|
|
|
indexMeta.IndexFilePaths = it.savePaths
|
|
indexMeta.SerializeSize = it.serializedSize
|
|
|
|
if taskState == TaskStateFailed {
|
|
log.Error("IndexNode IndexBuildTask saveIndexMeta set indexMeta.state to IndexState_Failed",
|
|
zap.String("TaskState", taskState.String()),
|
|
zap.Int64("IndexBuildID", indexMeta.IndexBuildID), zap.Error(it.err))
|
|
indexMeta.State = commonpb.IndexState_Failed
|
|
indexMeta.FailReason = it.err.Error()
|
|
} else if taskState == TaskStateRetry {
|
|
log.Info("IndexNode IndexBuildTask saveIndexMeta set indexMeta.state to IndexState_Unissued",
|
|
zap.String("TaskState", taskState.String()),
|
|
zap.Int64("IndexBuildID", indexMeta.IndexBuildID), zap.Error(it.internalErr))
|
|
indexMeta.State = commonpb.IndexState_Unissued
|
|
} else { // TaskStateNormal
|
|
log.Info("IndexNode IndexBuildTask saveIndexmeta indexMeta.state to IndexState_Unissued",
|
|
zap.String("TaskState", taskState.String()),
|
|
zap.Int64("IndexBuildID", indexMeta.IndexBuildID))
|
|
indexMeta.State = commonpb.IndexState_Finished
|
|
}
|
|
|
|
var metaValue []byte
|
|
metaValue, err = proto.Marshal(indexMeta)
|
|
if err != nil {
|
|
errMsg := fmt.Sprintf("IndexNode IndexBuildTask saveIndexMeta fail to marshal index meta, IndexBuildID=%d, err=%s",
|
|
indexMeta.IndexBuildID, err.Error())
|
|
panic(errMsg)
|
|
}
|
|
|
|
strMetaValue := string(metaValue)
|
|
|
|
return it.etcdKV.CompareVersionAndSwap(it.req.MetaPath, version, strMetaValue)
|
|
}
|
|
|
|
err := retry.Do(ctx, fn, retry.Attempts(3))
|
|
if err != nil {
|
|
panic(err.Error())
|
|
}
|
|
return nil
|
|
}
|
|
|
|
// PreExecute does some checks before building the index, for example, whether the index has been deleted.
|
|
func (it *IndexBuildTask) PreExecute(ctx context.Context) error {
|
|
log.Debug("IndexNode IndexBuildTask preExecute...", zap.Int64("buildId", it.req.IndexBuildID))
|
|
sp, ctx := trace.StartSpanFromContextWithOperationName(ctx, "CreateIndex-PreExecute")
|
|
defer sp.Finish()
|
|
indexMeta, _, err := it.loadIndexMeta(ctx)
|
|
if err != nil {
|
|
// assume that we can loadIndexMeta later...
|
|
return nil
|
|
}
|
|
it.updateTaskState(indexMeta)
|
|
return nil
|
|
}
|
|
|
|
// PostExecute does some checks after building the index, for example, whether the index has been deleted or
|
|
// whether the index task is up to date.
|
|
func (it *IndexBuildTask) PostExecute(ctx context.Context) error {
|
|
log.Debug("IndexNode IndexBuildTask PostExecute...", zap.Int64("buildId", it.req.IndexBuildID))
|
|
sp, _ := trace.StartSpanFromContextWithOperationName(ctx, "CreateIndex-PostExecute")
|
|
defer sp.Finish()
|
|
return it.saveIndexMeta(ctx)
|
|
}
|
|
|
|
func (it *IndexBuildTask) prepareParams(ctx context.Context) error {
|
|
typeParams := make(map[string]string)
|
|
for _, kvPair := range it.req.GetTypeParams() {
|
|
key, value := kvPair.GetKey(), kvPair.GetValue()
|
|
_, ok := typeParams[key]
|
|
if ok {
|
|
return errors.New("duplicated key in type params")
|
|
}
|
|
if key == paramsKeyToParse {
|
|
params, err := funcutil.ParseIndexParamsMap(value)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
for pk, pv := range params {
|
|
typeParams[pk] = pv
|
|
}
|
|
} else {
|
|
typeParams[key] = value
|
|
}
|
|
}
|
|
|
|
indexParams := make(map[string]string)
|
|
for _, kvPair := range it.req.GetIndexParams() {
|
|
key, value := kvPair.GetKey(), kvPair.GetValue()
|
|
_, ok := indexParams[key]
|
|
if ok {
|
|
return errors.New("duplicated key in index params")
|
|
}
|
|
if key == paramsKeyToParse {
|
|
params, err := funcutil.ParseIndexParamsMap(value)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
for pk, pv := range params {
|
|
indexParams[pk] = pv
|
|
}
|
|
} else {
|
|
indexParams[key] = value
|
|
}
|
|
}
|
|
it.newTypeParams = typeParams
|
|
it.newIndexParams = indexParams
|
|
return nil
|
|
}
|
|
|
|
func (it *IndexBuildTask) loadVector(ctx context.Context) (storage.FieldID, storage.FieldData, error) {
|
|
getValueByPath := func(path string) ([]byte, error) {
|
|
data, err := it.kv.Load(path)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
return []byte(data), nil
|
|
}
|
|
getBlobByPath := func(path string) (*Blob, error) {
|
|
value, err := getValueByPath(path)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
return &Blob{
|
|
Key: path,
|
|
Value: value,
|
|
}, nil
|
|
}
|
|
|
|
toLoadDataPaths := it.req.GetDataPaths()
|
|
keys := make([]string, len(toLoadDataPaths))
|
|
blobs := make([]*Blob, len(toLoadDataPaths))
|
|
|
|
loadKey := func(idx int) error {
|
|
keys[idx] = toLoadDataPaths[idx]
|
|
blob, err := getBlobByPath(toLoadDataPaths[idx])
|
|
if err != nil {
|
|
return err
|
|
}
|
|
blobs[idx] = blob
|
|
return nil
|
|
}
|
|
// Use runtime.GOMAXPROCS(0) instead of runtime.NumCPU()
|
|
// to respect CPU quota of container/pod
|
|
// gomaxproc will be set by `automaxproc`, passing 0 will just retrieve the value
|
|
err := funcutil.ProcessFuncParallel(len(toLoadDataPaths), runtime.GOMAXPROCS(0), loadKey, "loadKey")
|
|
if err != nil {
|
|
log.Warn("loadKey from minio failed", zap.Error(err))
|
|
it.internalErr = err
|
|
// In this case, it.internalErr is no longer nil and err does not need to be returned, otherwise it.err will also be assigned.
|
|
return storage.InvalidUniqueID, nil, err
|
|
}
|
|
loadVectorDuration := it.tr.RecordSpan()
|
|
log.Debug("IndexNode load data success", zap.Int64("buildId", it.req.IndexBuildID))
|
|
it.tr.Record("load vector data done")
|
|
|
|
var insertCodec storage.InsertCodec
|
|
collectionID, partitionID, segmentID, insertData, err2 := insertCodec.DeserializeAll(blobs)
|
|
if err2 != nil {
|
|
return storage.InvalidUniqueID, nil, err2
|
|
}
|
|
|
|
// TODO: @xiaocai2333 metrics.IndexNodeLoadBinlogLatency should be added above, put here to get segmentID.
|
|
metrics.IndexNodeLoadBinlogLatency.WithLabelValues(strconv.FormatInt(Params.IndexNodeCfg.NodeID, 10), strconv.FormatInt(it.segmentID, 10)).Observe(float64(loadVectorDuration))
|
|
metrics.IndexNodeDecodeBinlogLatency.WithLabelValues(strconv.FormatInt(Params.IndexNodeCfg.NodeID, 10), strconv.FormatInt(it.segmentID, 10)).Observe(float64(it.tr.RecordSpan()))
|
|
|
|
if len(insertData.Data) != 1 {
|
|
return storage.InvalidUniqueID, nil, errors.New("we expect only one field in deserialized insert data")
|
|
}
|
|
it.collectionID = collectionID
|
|
it.partitionID = partitionID
|
|
it.segmentID = segmentID
|
|
|
|
log.Debug("IndexNode deserialize data success",
|
|
zap.Int64("taskID", it.ID()),
|
|
zap.Int64("IndexID", it.req.IndexID),
|
|
zap.Int64("index buildID", it.req.IndexBuildID),
|
|
zap.Int64("collectionID", it.collectionID),
|
|
zap.Int64("partitionID", it.partitionID),
|
|
zap.Int64("segmentID", it.segmentID))
|
|
|
|
it.tr.Record("deserialize vector data done")
|
|
|
|
// we can ensure that there blobs are in one Field
|
|
var data storage.FieldData
|
|
var fieldID storage.FieldID
|
|
for fID, value := range insertData.Data {
|
|
data = value
|
|
fieldID = fID
|
|
break
|
|
}
|
|
return fieldID, data, nil
|
|
}
|
|
|
|
func (it *IndexBuildTask) buildIndex(ctx context.Context) ([]*storage.Blob, error) {
|
|
var fieldID storage.FieldID
|
|
{
|
|
var err error
|
|
var fieldData storage.FieldData
|
|
fieldID, fieldData, err = it.loadVector(ctx)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
floatVectorFieldData, fOk := fieldData.(*storage.FloatVectorFieldData)
|
|
if fOk {
|
|
err := it.index.BuildFloatVecIndexWithoutIds(floatVectorFieldData.Data)
|
|
if err != nil {
|
|
log.Error("IndexNode BuildFloatVecIndexWithoutIds failed", zap.Error(err))
|
|
return nil, err
|
|
}
|
|
}
|
|
binaryVectorFieldData, bOk := fieldData.(*storage.BinaryVectorFieldData)
|
|
if bOk {
|
|
err := it.index.BuildBinaryVecIndexWithoutIds(binaryVectorFieldData.Data)
|
|
if err != nil {
|
|
log.Error("IndexNode BuildBinaryVecIndexWithoutIds failed", zap.Error(err))
|
|
return nil, err
|
|
}
|
|
}
|
|
|
|
metrics.IndexNodeKnowhereBuildIndexLatency.WithLabelValues(strconv.FormatInt(Params.IndexNodeCfg.NodeID, 10), strconv.FormatInt(it.segmentID, 10)).Observe(float64(it.tr.RecordSpan()))
|
|
|
|
if !fOk && !bOk {
|
|
return nil, errors.New("we expect FloatVectorFieldData or BinaryVectorFieldData")
|
|
}
|
|
it.tr.Record("build index done")
|
|
}
|
|
|
|
indexBlobs, err := it.index.Serialize()
|
|
if err != nil {
|
|
log.Error("IndexNode index Serialize failed", zap.Error(err))
|
|
return nil, err
|
|
}
|
|
it.tr.Record("index serialize done")
|
|
|
|
// early release index for gc, and we can ensure that Delete is idempotent.
|
|
if err := it.index.Delete(); err != nil {
|
|
log.Error("IndexNode IndexBuildTask Execute CIndexDelete failed",
|
|
zap.Int64("buildId", it.req.IndexBuildID),
|
|
zap.Error(err))
|
|
}
|
|
|
|
var serializedIndexBlobs []*storage.Blob
|
|
codec := storage.NewIndexFileBinlogCodec()
|
|
serializedIndexBlobs, err = codec.Serialize(
|
|
it.req.IndexBuildID,
|
|
it.req.Version,
|
|
it.collectionID,
|
|
it.partitionID,
|
|
it.segmentID,
|
|
fieldID,
|
|
it.newIndexParams,
|
|
it.req.IndexName,
|
|
it.req.IndexID,
|
|
indexBlobs,
|
|
)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
encodeIndexFileDur := it.tr.Record("index codec serialize done")
|
|
metrics.IndexNodeEncodeIndexFileLatency.WithLabelValues(strconv.FormatInt(Params.IndexNodeCfg.NodeID, 10),
|
|
strconv.FormatInt(it.segmentID, 10)).Observe(float64(encodeIndexFileDur.Milliseconds()))
|
|
return serializedIndexBlobs, nil
|
|
}
|
|
|
|
func (it *IndexBuildTask) saveIndex(ctx context.Context, blobs []*storage.Blob) error {
|
|
blobCnt := len(blobs)
|
|
it.serializedSize = 0
|
|
for i := range blobs {
|
|
it.serializedSize += uint64(len(blobs[i].Value))
|
|
}
|
|
|
|
getSavePathByKey := func(key string) string {
|
|
return path.Join(Params.IndexNodeCfg.IndexStorageRootPath, strconv.Itoa(int(it.req.IndexBuildID)), strconv.Itoa(int(it.req.Version)),
|
|
strconv.Itoa(int(it.partitionID)), strconv.Itoa(int(it.segmentID)), key)
|
|
}
|
|
|
|
it.savePaths = make([]string, blobCnt)
|
|
saveIndexFile := func(idx int) error {
|
|
blob := blobs[idx]
|
|
savePath := getSavePathByKey(blob.Key)
|
|
saveIndexFileFn := func() error {
|
|
v, err := it.etcdKV.Load(it.req.MetaPath)
|
|
if err != nil {
|
|
log.Warn("IndexNode load meta failed", zap.Any("path", it.req.MetaPath), zap.Error(err))
|
|
return err
|
|
}
|
|
indexMeta := indexpb.IndexMeta{}
|
|
err = proto.Unmarshal([]byte(v), &indexMeta)
|
|
if err != nil {
|
|
log.Warn("IndexNode Unmarshal indexMeta error ", zap.Error(err))
|
|
return err
|
|
}
|
|
//log.Debug("IndexNode Unmarshal indexMeta success ", zap.Any("meta", indexMeta))
|
|
if indexMeta.Version > it.req.Version {
|
|
log.Warn("IndexNode try saveIndexFile failed req.Version is low", zap.Any("req.Version", it.req.Version),
|
|
zap.Any("indexMeta.Version", indexMeta.Version))
|
|
return errors.New("This task has been reassigned, check indexMeta.version and request ")
|
|
}
|
|
return it.kv.Save(savePath, string(blob.Value))
|
|
}
|
|
err := retry.Do(ctx, saveIndexFileFn, retry.Attempts(5))
|
|
if err != nil {
|
|
log.Warn("IndexNode try saveIndexFile final", zap.Error(err), zap.Any("savePath", savePath))
|
|
return err
|
|
}
|
|
it.savePaths[idx] = savePath
|
|
return nil
|
|
}
|
|
|
|
err := funcutil.ProcessFuncParallel(blobCnt, runtime.NumCPU(), saveIndexFile, "saveIndexFile")
|
|
if err != nil {
|
|
log.Warn("saveIndexFile to minio failed", zap.Error(err))
|
|
// In this case, we intend not to return err, otherwise the task will be marked as failed.
|
|
it.internalErr = err
|
|
}
|
|
return nil
|
|
}
|
|
|
|
func (it *IndexBuildTask) releaseMemory() {
|
|
debug.FreeOSMemory()
|
|
}
|
|
|
|
// Execute actually performs the task of building an index.
|
|
func (it *IndexBuildTask) Execute(ctx context.Context) error {
|
|
log.Debug("IndexNode IndexBuildTask Execute ...", zap.Int64("buildId", it.req.IndexBuildID))
|
|
sp, _ := trace.StartSpanFromContextWithOperationName(ctx, "CreateIndex-Execute")
|
|
defer sp.Finish()
|
|
|
|
if err := it.prepareParams(ctx); err != nil {
|
|
it.SetState(TaskStateFailed)
|
|
log.Error("IndexNode IndexBuildTask Execute prepareParams failed",
|
|
zap.Int64("buildId", it.req.IndexBuildID),
|
|
zap.Error(err))
|
|
return err
|
|
}
|
|
|
|
defer it.releaseMemory()
|
|
|
|
var err error
|
|
it.index, err = NewCIndex(it.newTypeParams, it.newIndexParams)
|
|
if err != nil {
|
|
it.SetState(TaskStateFailed)
|
|
log.Error("IndexNode IndexBuildTask Execute NewCIndex failed",
|
|
zap.Int64("buildId", it.req.IndexBuildID),
|
|
zap.Error(err))
|
|
return err
|
|
}
|
|
|
|
defer func() {
|
|
err := it.index.Delete()
|
|
if err != nil {
|
|
log.Error("IndexNode IndexBuildTask Execute CIndexDelete failed",
|
|
zap.Int64("buildId", it.req.IndexBuildID),
|
|
zap.Error(err))
|
|
}
|
|
}()
|
|
|
|
it.tr.Record("new CIndex")
|
|
var blobs []*storage.Blob
|
|
blobs, err = it.buildIndex(ctx)
|
|
if err != nil {
|
|
it.SetState(TaskStateFailed)
|
|
log.Error("IndexNode IndexBuildTask Execute buildIndex failed",
|
|
zap.Int64("buildId", it.req.IndexBuildID),
|
|
zap.Error(err))
|
|
return err
|
|
}
|
|
|
|
err = it.saveIndex(ctx, blobs)
|
|
if err != nil {
|
|
it.SetState(TaskStateRetry)
|
|
return err
|
|
}
|
|
saveIndexFileDur := it.tr.Record("index file save done")
|
|
metrics.IndexNodeSaveIndexFileLatency.WithLabelValues(strconv.FormatInt(Params.IndexNodeCfg.NodeID, 10),
|
|
strconv.FormatInt(it.segmentID, 10)).Observe(float64(saveIndexFileDur.Milliseconds()))
|
|
it.tr.Elapse("index building all done")
|
|
log.Info("IndexNode CreateIndex successfully ", zap.Int64("collect", it.collectionID),
|
|
zap.Int64("partition", it.partitionID), zap.Int64("segment", it.segmentID))
|
|
|
|
return nil
|
|
}
|