mirror of
https://gitee.com/milvus-io/milvus.git
synced 2024-12-05 13:28:49 +08:00
639800241d
Signed-off-by: godchen <qingxiang.chen@zilliz.com>
167 lines
5.2 KiB
Go
167 lines
5.2 KiB
Go
// Licensed to the LF AI & Data foundation under one
|
|
// or more contributor license agreements. See the NOTICE file
|
|
// distributed with this work for additional information
|
|
// regarding copyright ownership. The ASF licenses this file
|
|
// to you under the Apache License, Version 2.0 (the
|
|
// "License"); you may not use this file except in compliance
|
|
// with the License. You may obtain a copy of the License at
|
|
//
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
//
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
// See the License for the specific language governing permissions and
|
|
// limitations under the License.
|
|
|
|
package msgstream
|
|
|
|
import (
|
|
"errors"
|
|
"fmt"
|
|
"strconv"
|
|
|
|
"github.com/milvus-io/milvus/internal/proto/commonpb"
|
|
"github.com/milvus-io/milvus/internal/proto/internalpb"
|
|
)
|
|
|
|
// InsertRepackFunc is used to repack messages after hash by primary key
|
|
func InsertRepackFunc(tsMsgs []TsMsg, hashKeys [][]int32) (map[int32]*MsgPack, error) {
|
|
result := make(map[int32]*MsgPack)
|
|
for i, request := range tsMsgs {
|
|
if request.Type() != commonpb.MsgType_Insert {
|
|
return nil, errors.New("msg's must be Insert")
|
|
}
|
|
insertRequest := request.(*InsertMsg)
|
|
keys := hashKeys[i]
|
|
|
|
timestampLen := len(insertRequest.Timestamps)
|
|
rowIDLen := len(insertRequest.RowIDs)
|
|
rowDataLen := len(insertRequest.RowData)
|
|
keysLen := len(keys)
|
|
|
|
if keysLen != timestampLen || keysLen != rowIDLen || keysLen != rowDataLen {
|
|
return nil, errors.New("the length of hashValue, timestamps, rowIDs, RowData are not equal")
|
|
}
|
|
for index, key := range keys {
|
|
_, ok := result[key]
|
|
if !ok {
|
|
msgPack := MsgPack{}
|
|
result[key] = &msgPack
|
|
}
|
|
|
|
sliceRequest := internalpb.InsertRequest{
|
|
Base: &commonpb.MsgBase{
|
|
MsgType: commonpb.MsgType_Insert,
|
|
MsgID: insertRequest.Base.MsgID,
|
|
Timestamp: insertRequest.Timestamps[index],
|
|
SourceID: insertRequest.Base.SourceID,
|
|
},
|
|
DbID: insertRequest.DbID,
|
|
CollectionID: insertRequest.CollectionID,
|
|
PartitionID: insertRequest.PartitionID,
|
|
CollectionName: insertRequest.CollectionName,
|
|
PartitionName: insertRequest.PartitionName,
|
|
SegmentID: insertRequest.SegmentID,
|
|
ShardName: insertRequest.ShardName,
|
|
Timestamps: []uint64{insertRequest.Timestamps[index]},
|
|
RowIDs: []int64{insertRequest.RowIDs[index]},
|
|
RowData: []*commonpb.Blob{insertRequest.RowData[index]},
|
|
}
|
|
|
|
insertMsg := &InsertMsg{
|
|
BaseMsg: BaseMsg{
|
|
Ctx: request.TraceCtx(),
|
|
},
|
|
InsertRequest: sliceRequest,
|
|
}
|
|
result[key].Msgs = append(result[key].Msgs, insertMsg)
|
|
}
|
|
}
|
|
return result, nil
|
|
}
|
|
|
|
// DeleteRepackFunc is used to repack messages after hash by primary key
|
|
func DeleteRepackFunc(tsMsgs []TsMsg, hashKeys [][]int32) (map[int32]*MsgPack, error) {
|
|
result := make(map[int32]*MsgPack)
|
|
for i, request := range tsMsgs {
|
|
if request.Type() != commonpb.MsgType_Delete {
|
|
return nil, errors.New("msg's must be Delete")
|
|
}
|
|
deleteRequest := request.(*DeleteMsg)
|
|
keys := hashKeys[i]
|
|
|
|
if len(keys) != 1 {
|
|
return nil, errors.New("len(msg.hashValue) must equal 1, but it is: " + strconv.Itoa(len(keys)))
|
|
}
|
|
|
|
timestampLen := len(deleteRequest.Timestamps)
|
|
pkLen := len(deleteRequest.PrimaryKeys)
|
|
keysLen := len(keys)
|
|
|
|
if keysLen != timestampLen || keysLen != pkLen {
|
|
return nil, errors.New("the length of hashValue, timestamps, primaryKeys are not equal")
|
|
}
|
|
|
|
for index, key := range keys {
|
|
_, ok := result[key]
|
|
if !ok {
|
|
msgPack := MsgPack{}
|
|
result[key] = &msgPack
|
|
}
|
|
|
|
sliceRequest := internalpb.DeleteRequest{
|
|
Base: &commonpb.MsgBase{
|
|
MsgType: commonpb.MsgType_Delete,
|
|
MsgID: deleteRequest.Base.MsgID,
|
|
Timestamp: deleteRequest.Timestamps[index],
|
|
SourceID: deleteRequest.Base.SourceID,
|
|
},
|
|
DbID: deleteRequest.DbID,
|
|
CollectionID: deleteRequest.CollectionID,
|
|
PartitionID: deleteRequest.PartitionID,
|
|
CollectionName: deleteRequest.CollectionName,
|
|
PartitionName: deleteRequest.PartitionName,
|
|
ShardName: deleteRequest.ShardName,
|
|
Timestamps: []uint64{deleteRequest.Timestamps[index]},
|
|
PrimaryKeys: []int64{deleteRequest.PrimaryKeys[index]},
|
|
}
|
|
|
|
deleteMsg := &DeleteMsg{
|
|
BaseMsg: BaseMsg{
|
|
Ctx: request.TraceCtx(),
|
|
},
|
|
DeleteRequest: sliceRequest,
|
|
}
|
|
result[key].Msgs = append(result[key].Msgs, deleteMsg)
|
|
}
|
|
}
|
|
return result, nil
|
|
}
|
|
|
|
// DefaultRepackFunc is used to repack messages after hash by primary key
|
|
func DefaultRepackFunc(tsMsgs []TsMsg, hashKeys [][]int32) (map[int32]*MsgPack, error) {
|
|
if len(hashKeys) < len(tsMsgs) {
|
|
return nil, fmt.Errorf(
|
|
"the length of hash keys (%d) is less than the length of messages (%d)",
|
|
len(hashKeys),
|
|
len(tsMsgs),
|
|
)
|
|
}
|
|
|
|
// after assigning segment id to msg, tsMsgs was already re-bucketed
|
|
pack := make(map[int32]*MsgPack)
|
|
for idx, msg := range tsMsgs {
|
|
if len(hashKeys[idx]) <= 0 {
|
|
return nil, fmt.Errorf("no hash key for %dth message", idx)
|
|
}
|
|
key := hashKeys[idx][0]
|
|
_, ok := pack[key]
|
|
if !ok {
|
|
pack[key] = &MsgPack{}
|
|
}
|
|
pack[key].Msgs = append(pack[key].Msgs, msg)
|
|
}
|
|
return pack, nil
|
|
}
|