2021-04-19 15:16:33 +08:00
|
|
|
// Copyright (C) 2019-2020 Zilliz. All rights reserved.
|
|
|
|
//
|
|
|
|
// Licensed under the Apache License, Version 2.0 (the "License"); you may not use this file except in compliance
|
|
|
|
// with the License. You may obtain a copy of the License at
|
|
|
|
//
|
|
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
//
|
|
|
|
// Unless required by applicable law or agreed to in writing, software distributed under the License
|
|
|
|
// is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express
|
|
|
|
// or implied. See the License for the specific language governing permissions and limitations under the License.
|
|
|
|
|
2021-01-19 11:37:16 +08:00
|
|
|
package datanode
|
|
|
|
|
|
|
|
import (
|
2021-06-07 13:58:37 +08:00
|
|
|
"sync"
|
|
|
|
|
2021-02-26 10:13:36 +08:00
|
|
|
"go.uber.org/zap"
|
|
|
|
|
2021-04-22 14:45:57 +08:00
|
|
|
"github.com/milvus-io/milvus/internal/log"
|
|
|
|
"github.com/milvus-io/milvus/internal/msgstream"
|
2021-06-02 15:58:33 +08:00
|
|
|
"github.com/milvus-io/milvus/internal/proto/commonpb"
|
2021-06-07 13:58:37 +08:00
|
|
|
"github.com/milvus-io/milvus/internal/proto/datapb"
|
2021-06-02 15:58:33 +08:00
|
|
|
"github.com/milvus-io/milvus/internal/proto/internalpb"
|
2021-04-22 14:45:57 +08:00
|
|
|
"github.com/milvus-io/milvus/internal/util/flowgraph"
|
2021-01-19 11:37:16 +08:00
|
|
|
)
|
|
|
|
|
|
|
|
type ddNode struct {
|
|
|
|
BaseNode
|
2021-06-07 11:25:37 +08:00
|
|
|
|
|
|
|
clearSignal chan<- UniqueID
|
|
|
|
collectionID UniqueID
|
2021-06-07 13:58:37 +08:00
|
|
|
|
2021-06-08 19:25:37 +08:00
|
|
|
mu sync.RWMutex
|
|
|
|
seg2SegInfo map[UniqueID]*datapb.SegmentInfo // Segment ID to UnFlushed Segment
|
|
|
|
vchanInfo *datapb.VchannelInfo
|
2021-01-19 11:37:16 +08:00
|
|
|
}
|
|
|
|
|
2021-06-02 15:58:33 +08:00
|
|
|
func (ddn *ddNode) Name() string {
|
2021-01-19 11:37:16 +08:00
|
|
|
return "ddNode"
|
|
|
|
}
|
|
|
|
|
2021-06-02 15:58:33 +08:00
|
|
|
func (ddn *ddNode) Operate(in []flowgraph.Msg) []flowgraph.Msg {
|
2021-06-08 19:25:37 +08:00
|
|
|
|
|
|
|
// log.Debug("DDNode Operating")
|
|
|
|
|
2021-01-19 11:37:16 +08:00
|
|
|
if len(in) != 1 {
|
2021-02-26 10:13:36 +08:00
|
|
|
log.Error("Invalid operate message input in ddNode", zap.Int("input length", len(in)))
|
2021-01-19 11:37:16 +08:00
|
|
|
// TODO: add error handling
|
|
|
|
}
|
|
|
|
|
2021-05-31 15:28:30 +08:00
|
|
|
if len(in) == 0 {
|
|
|
|
return []flowgraph.Msg{}
|
|
|
|
}
|
|
|
|
|
2021-02-25 17:35:36 +08:00
|
|
|
msMsg, ok := in[0].(*MsgStreamMsg)
|
2021-01-19 11:37:16 +08:00
|
|
|
if !ok {
|
2021-02-26 10:13:36 +08:00
|
|
|
log.Error("type assertion failed for MsgStreamMsg")
|
2021-01-19 11:37:16 +08:00
|
|
|
// TODO: add error handling
|
|
|
|
}
|
|
|
|
|
2021-03-23 01:49:50 +08:00
|
|
|
if msMsg == nil {
|
2021-03-25 14:41:46 +08:00
|
|
|
return []Msg{}
|
|
|
|
}
|
2021-03-23 01:49:50 +08:00
|
|
|
|
2021-06-02 15:58:33 +08:00
|
|
|
var iMsg = insertMsg{
|
|
|
|
insertMessages: make([]*msgstream.InsertMsg, 0),
|
2021-01-19 11:37:16 +08:00
|
|
|
timeRange: TimeRange{
|
|
|
|
timestampMin: msMsg.TimestampMin(),
|
|
|
|
timestampMax: msMsg.TimestampMax(),
|
|
|
|
},
|
2021-06-02 15:58:33 +08:00
|
|
|
startPositions: make([]*internalpb.MsgPosition, 0),
|
|
|
|
endPositions: make([]*internalpb.MsgPosition, 0),
|
2021-01-19 11:37:16 +08:00
|
|
|
}
|
|
|
|
|
2021-06-02 15:58:33 +08:00
|
|
|
for _, msg := range msMsg.TsMessages() {
|
|
|
|
switch msg.Type() {
|
|
|
|
case commonpb.MsgType_DropCollection:
|
2021-06-07 11:25:37 +08:00
|
|
|
if msg.(*msgstream.DropCollectionMsg).GetCollectionID() == ddn.collectionID {
|
2021-06-09 17:31:48 +08:00
|
|
|
log.Info("Destroying current flowgraph", zap.Any("collectionID", ddn.collectionID))
|
2021-06-07 11:25:37 +08:00
|
|
|
ddn.clearSignal <- ddn.collectionID
|
|
|
|
}
|
2021-06-02 15:58:33 +08:00
|
|
|
case commonpb.MsgType_Insert:
|
2021-06-08 19:25:37 +08:00
|
|
|
log.Debug("DDNode with insert messages")
|
2021-06-07 13:58:37 +08:00
|
|
|
if msg.EndTs() < FilterThreshold {
|
2021-06-08 19:25:37 +08:00
|
|
|
log.Info("Filtering Insert Messages",
|
|
|
|
zap.Uint64("Message endts", msg.EndTs()),
|
|
|
|
zap.Uint64("FilterThreshold", FilterThreshold),
|
|
|
|
)
|
2021-06-11 09:24:52 +08:00
|
|
|
if ddn.filterFlushedSegmentInsertMessages(msg.(*msgstream.InsertMsg)) {
|
|
|
|
continue
|
2021-06-07 13:58:37 +08:00
|
|
|
}
|
2021-05-31 15:28:30 +08:00
|
|
|
}
|
2021-06-07 13:58:37 +08:00
|
|
|
iMsg.insertMessages = append(iMsg.insertMessages, msg.(*msgstream.InsertMsg))
|
2021-01-19 11:37:16 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2021-06-02 15:58:33 +08:00
|
|
|
iMsg.startPositions = append(iMsg.startPositions, msMsg.StartPositions()...)
|
|
|
|
iMsg.endPositions = append(iMsg.endPositions, msMsg.EndPositions()...)
|
2021-01-22 19:36:09 +08:00
|
|
|
|
2021-06-02 15:58:33 +08:00
|
|
|
var res Msg = &iMsg
|
2021-05-25 15:35:37 +08:00
|
|
|
|
2021-03-25 14:41:46 +08:00
|
|
|
return []Msg{res}
|
2021-01-19 11:37:16 +08:00
|
|
|
}
|
|
|
|
|
2021-06-11 09:24:52 +08:00
|
|
|
func (ddn *ddNode) filterFlushedSegmentInsertMessages(msg *msgstream.InsertMsg) bool {
|
2021-06-07 13:58:37 +08:00
|
|
|
if ddn.isFlushed(msg.GetSegmentID()) {
|
2021-06-11 09:24:52 +08:00
|
|
|
return true
|
2021-06-07 13:58:37 +08:00
|
|
|
}
|
|
|
|
|
2021-06-08 19:25:37 +08:00
|
|
|
ddn.mu.Lock()
|
|
|
|
if si, ok := ddn.seg2SegInfo[msg.GetSegmentID()]; ok {
|
2021-06-11 11:37:24 +08:00
|
|
|
if msg.EndTs() <= si.GetDmlPosition().GetTimestamp() {
|
2021-06-11 09:24:52 +08:00
|
|
|
return true
|
2021-06-07 13:58:37 +08:00
|
|
|
}
|
2021-06-11 11:37:24 +08:00
|
|
|
delete(ddn.seg2SegInfo, msg.GetSegmentID())
|
2021-06-07 13:58:37 +08:00
|
|
|
}
|
|
|
|
|
2021-06-08 19:25:37 +08:00
|
|
|
ddn.mu.Unlock()
|
2021-06-11 09:24:52 +08:00
|
|
|
return false
|
2021-05-19 19:42:07 +08:00
|
|
|
}
|
|
|
|
|
2021-06-07 13:58:37 +08:00
|
|
|
func (ddn *ddNode) isFlushed(segmentID UniqueID) bool {
|
|
|
|
ddn.mu.Lock()
|
|
|
|
defer ddn.mu.Unlock()
|
|
|
|
|
|
|
|
for _, id := range ddn.vchanInfo.GetFlushedSegments() {
|
|
|
|
if id == segmentID {
|
|
|
|
return true
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return false
|
|
|
|
}
|
|
|
|
|
|
|
|
func newDDNode(clearSignal chan<- UniqueID, collID UniqueID, vchanInfo *datapb.VchannelInfo) *ddNode {
|
2021-01-19 11:37:16 +08:00
|
|
|
baseNode := BaseNode{}
|
2021-06-02 15:58:33 +08:00
|
|
|
baseNode.SetMaxParallelism(Params.FlowGraphMaxQueueLength)
|
2021-01-19 11:37:16 +08:00
|
|
|
|
2021-06-08 19:25:37 +08:00
|
|
|
si := make(map[UniqueID]*datapb.SegmentInfo)
|
|
|
|
for _, us := range vchanInfo.GetUnflushedSegments() {
|
|
|
|
si[us.GetID()] = us
|
2021-06-07 13:58:37 +08:00
|
|
|
}
|
|
|
|
|
2021-01-19 11:37:16 +08:00
|
|
|
return &ddNode{
|
2021-06-07 11:25:37 +08:00
|
|
|
BaseNode: baseNode,
|
|
|
|
clearSignal: clearSignal,
|
|
|
|
collectionID: collID,
|
2021-06-08 19:25:37 +08:00
|
|
|
seg2SegInfo: si,
|
2021-06-07 13:58:37 +08:00
|
|
|
vchanInfo: vchanInfo,
|
2021-01-19 11:37:16 +08:00
|
|
|
}
|
|
|
|
}
|