mirror of
https://gitee.com/milvus-io/milvus.git
synced 2024-12-05 05:18:52 +08:00
1c1f2a1371
related #29588 Signed-off-by: lixinguo <xinguo.li@zilliz.com> Co-authored-by: lixinguo <xinguo.li@zilliz.com>
202 lines
5.9 KiB
Go
202 lines
5.9 KiB
Go
// Licensed to the LF AI & Data foundation under one
|
|
// or more contributor license agreements. See the NOTICE file
|
|
// distributed with this work for additional information
|
|
// regarding copyright ownership. The ASF licenses this file
|
|
// to you under the Apache License, Version 2.0 (the
|
|
// "License"); you may not use this file except in compliance
|
|
// with the License. You may obtain a copy of the License at
|
|
//
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
//
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
// See the License for the specific language governing permissions and
|
|
// limitations under the License.
|
|
|
|
package flowgraph
|
|
|
|
import (
|
|
"context"
|
|
"fmt"
|
|
"time"
|
|
|
|
"go.opentelemetry.io/otel"
|
|
"go.opentelemetry.io/otel/trace"
|
|
"go.uber.org/atomic"
|
|
"go.uber.org/zap"
|
|
|
|
"github.com/milvus-io/milvus-proto/go-api/v2/commonpb"
|
|
"github.com/milvus-io/milvus/pkg/log"
|
|
"github.com/milvus-io/milvus/pkg/metrics"
|
|
"github.com/milvus-io/milvus/pkg/mq/msgstream"
|
|
"github.com/milvus-io/milvus/pkg/util/paramtable"
|
|
"github.com/milvus-io/milvus/pkg/util/tsoutil"
|
|
"github.com/milvus-io/milvus/pkg/util/typeutil"
|
|
)
|
|
|
|
const (
|
|
CloseGracefully bool = true
|
|
CloseImmediately bool = false
|
|
)
|
|
|
|
// InputNode is the entry point of flowgragh
|
|
type InputNode struct {
|
|
BaseNode
|
|
input <-chan *msgstream.MsgPack
|
|
lastMsg *msgstream.MsgPack
|
|
name string
|
|
role string
|
|
nodeID int64
|
|
collectionID int64
|
|
dataType string
|
|
|
|
closeGracefully *atomic.Bool
|
|
|
|
skipMode bool
|
|
skipCount int
|
|
lastNotTimetickTime time.Time
|
|
}
|
|
|
|
// IsInputNode returns whether Node is InputNode
|
|
func (inNode *InputNode) IsInputNode() bool {
|
|
return true
|
|
}
|
|
|
|
func (inNode *InputNode) IsValidInMsg(in []Msg) bool {
|
|
return true
|
|
}
|
|
|
|
// Name returns node name
|
|
func (inNode *InputNode) Name() string {
|
|
return inNode.name
|
|
}
|
|
|
|
func (inNode *InputNode) SetCloseMethod(gracefully bool) {
|
|
inNode.closeGracefully.Store(gracefully)
|
|
log.Info("input node close method set",
|
|
zap.String("node", inNode.Name()),
|
|
zap.Int64("collection", inNode.collectionID),
|
|
zap.Bool("gracefully", gracefully))
|
|
}
|
|
|
|
// Operate consume a message pack from msgstream and return
|
|
func (inNode *InputNode) Operate(in []Msg) []Msg {
|
|
msgPack, ok := <-inNode.input
|
|
if !ok {
|
|
log := log.With(
|
|
zap.String("node", inNode.Name()),
|
|
zap.Int64("collection", inNode.collectionID),
|
|
)
|
|
log.Info("input node message stream closed",
|
|
zap.Bool("closeGracefully", inNode.closeGracefully.Load()),
|
|
)
|
|
if inNode.lastMsg != nil && inNode.closeGracefully.Load() {
|
|
log.Info("input node trigger force sync",
|
|
zap.Any("position", inNode.lastMsg.EndPositions))
|
|
return []Msg{&MsgStreamMsg{
|
|
BaseMsg: NewBaseMsg(true),
|
|
tsMessages: []msgstream.TsMsg{},
|
|
timestampMin: inNode.lastMsg.BeginTs,
|
|
timestampMax: inNode.lastMsg.EndTs,
|
|
startPositions: inNode.lastMsg.StartPositions,
|
|
endPositions: inNode.lastMsg.EndPositions,
|
|
}}
|
|
}
|
|
return []Msg{&MsgStreamMsg{
|
|
BaseMsg: NewBaseMsg(true),
|
|
}}
|
|
}
|
|
|
|
// TODO: add status
|
|
if msgPack == nil {
|
|
return []Msg{}
|
|
}
|
|
|
|
inNode.lastMsg = msgPack
|
|
sub := tsoutil.SubByNow(msgPack.EndTs)
|
|
if inNode.role == typeutil.DataNodeRole {
|
|
metrics.DataNodeConsumeMsgCount.
|
|
WithLabelValues(fmt.Sprint(inNode.nodeID), inNode.dataType, fmt.Sprint(inNode.collectionID)).
|
|
Inc()
|
|
|
|
metrics.DataNodeConsumeTimeTickLag.
|
|
WithLabelValues(fmt.Sprint(inNode.nodeID), inNode.dataType, fmt.Sprint(inNode.collectionID)).
|
|
Set(float64(sub))
|
|
}
|
|
|
|
var spans []trace.Span
|
|
defer func() {
|
|
for _, span := range spans {
|
|
span.End()
|
|
}
|
|
}()
|
|
for _, msg := range msgPack.Msgs {
|
|
ctx := msg.TraceCtx()
|
|
if ctx == nil {
|
|
ctx = context.Background()
|
|
}
|
|
ctx, sp := otel.Tracer(inNode.role).Start(ctx, "Operate")
|
|
sp.AddEvent("input_node name" + inNode.Name())
|
|
spans = append(spans, sp)
|
|
msg.SetTraceCtx(ctx)
|
|
}
|
|
|
|
// skip timetick message feature
|
|
if inNode.role == typeutil.DataNodeRole &&
|
|
len(msgPack.Msgs) > 0 &&
|
|
paramtable.Get().DataNodeCfg.FlowGraphSkipModeEnable.GetAsBool() {
|
|
if msgPack.Msgs[0].Type() == commonpb.MsgType_TimeTick {
|
|
if inNode.skipMode {
|
|
// if empty timetick message and in skipMode, will skip some of the timetick messages to reduce downstream work
|
|
if inNode.skipCount == paramtable.Get().DataNodeCfg.FlowGraphSkipModeSkipNum.GetAsInt() {
|
|
inNode.skipCount = 0
|
|
} else {
|
|
inNode.skipCount = inNode.skipCount + 1
|
|
return []Msg{}
|
|
}
|
|
} else {
|
|
cd := paramtable.Get().DataNodeCfg.FlowGraphSkipModeColdTime.GetAsInt()
|
|
if time.Since(inNode.lastNotTimetickTime) > time.Second*time.Duration(cd) {
|
|
inNode.skipMode = true
|
|
}
|
|
}
|
|
} else {
|
|
// if non empty message, refresh the lastNotTimetickTime and close skip mode
|
|
inNode.skipMode = false
|
|
inNode.skipCount = 0
|
|
inNode.lastNotTimetickTime = time.Now()
|
|
}
|
|
}
|
|
|
|
var msgStreamMsg Msg = &MsgStreamMsg{
|
|
tsMessages: msgPack.Msgs,
|
|
timestampMin: msgPack.BeginTs,
|
|
timestampMax: msgPack.EndTs,
|
|
startPositions: msgPack.StartPositions,
|
|
endPositions: msgPack.EndPositions,
|
|
}
|
|
|
|
return []Msg{msgStreamMsg}
|
|
}
|
|
|
|
// NewInputNode composes an InputNode with provided input channel, name and parameters
|
|
func NewInputNode(input <-chan *msgstream.MsgPack, nodeName string, maxQueueLength int32, maxParallelism int32, role string, nodeID int64, collectionID int64, dataType string) *InputNode {
|
|
baseNode := BaseNode{}
|
|
baseNode.SetMaxQueueLength(maxQueueLength)
|
|
baseNode.SetMaxParallelism(maxParallelism)
|
|
|
|
return &InputNode{
|
|
BaseNode: baseNode,
|
|
input: input,
|
|
name: nodeName,
|
|
role: role,
|
|
nodeID: nodeID,
|
|
collectionID: collectionID,
|
|
dataType: dataType,
|
|
closeGracefully: atomic.NewBool(CloseImmediately),
|
|
skipCount: 0,
|
|
lastNotTimetickTime: time.Now(),
|
|
}
|
|
}
|