mirror of
https://gitee.com/milvus-io/milvus.git
synced 2024-12-02 11:59:00 +08:00
0b905078e7
See also #27675 This PR makes the previously merged refactoring of datanode go online - Use write node to replace insert/delete node - Use write buffer manager to control all buffers - Use sync manager to control sync tasks instead of flush manager Signed-off-by: Congqi Xia <congqi.xia@zilliz.com>
195 lines
5.6 KiB
Go
195 lines
5.6 KiB
Go
// Licensed to the LF AI & Data foundation under one
|
|
// or more contributor license agreements. See the NOTICE file
|
|
// distributed with this work for additional information
|
|
// regarding copyright ownership. The ASF licenses this file
|
|
// to you under the Apache License, Version 2.0 (the
|
|
// "License"); you may not use this file except in compliance
|
|
// with the License. You may obtain a copy of the License at
|
|
//
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
//
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
// See the License for the specific language governing permissions and
|
|
// limitations under the License.
|
|
|
|
package datanode
|
|
|
|
import (
|
|
"context"
|
|
"fmt"
|
|
"sync"
|
|
"time"
|
|
|
|
"go.uber.org/zap"
|
|
|
|
"github.com/milvus-io/milvus-proto/go-api/v2/schemapb"
|
|
"github.com/milvus-io/milvus/internal/proto/datapb"
|
|
"github.com/milvus-io/milvus/pkg/log"
|
|
"github.com/milvus-io/milvus/pkg/metrics"
|
|
"github.com/milvus-io/milvus/pkg/util/hardware"
|
|
"github.com/milvus-io/milvus/pkg/util/paramtable"
|
|
"github.com/milvus-io/milvus/pkg/util/typeutil"
|
|
)
|
|
|
|
type flowgraphManager struct {
|
|
flowgraphs *typeutil.ConcurrentMap[string, *dataSyncService]
|
|
|
|
closeCh chan struct{}
|
|
closeOnce sync.Once
|
|
}
|
|
|
|
func newFlowgraphManager() *flowgraphManager {
|
|
return &flowgraphManager{
|
|
flowgraphs: typeutil.NewConcurrentMap[string, *dataSyncService](),
|
|
closeCh: make(chan struct{}),
|
|
}
|
|
}
|
|
|
|
func (fm *flowgraphManager) start(waiter *sync.WaitGroup) {
|
|
defer waiter.Done()
|
|
ticker := time.NewTicker(3 * time.Second)
|
|
defer ticker.Stop()
|
|
for {
|
|
select {
|
|
case <-fm.closeCh:
|
|
return
|
|
case <-ticker.C:
|
|
fm.execute(hardware.GetMemoryCount())
|
|
}
|
|
}
|
|
}
|
|
|
|
func (fm *flowgraphManager) close() {
|
|
fm.dropAll()
|
|
fm.closeOnce.Do(func() {
|
|
close(fm.closeCh)
|
|
})
|
|
}
|
|
|
|
func (fm *flowgraphManager) execute(totalMemory uint64) {
|
|
if !Params.DataNodeCfg.MemoryForceSyncEnable.GetAsBool() {
|
|
return
|
|
}
|
|
// TODO change to buffer manager
|
|
|
|
/*
|
|
var total int64
|
|
channels := make([]struct {
|
|
channel string
|
|
bufferSize int64
|
|
}, 0)
|
|
fm.flowgraphs.Range(func(key string, value *dataSyncService) bool {
|
|
size := value.channel.getTotalMemorySize()
|
|
channels = append(channels, struct {
|
|
channel string
|
|
bufferSize int64
|
|
}{key, size})
|
|
total += size
|
|
return true
|
|
})
|
|
if len(channels) == 0 {
|
|
return
|
|
}
|
|
|
|
toMB := func(mem float64) float64 {
|
|
return mem / 1024 / 1024
|
|
}
|
|
|
|
memoryWatermark := float64(totalMemory) * Params.DataNodeCfg.MemoryWatermark.GetAsFloat()
|
|
if float64(total) < memoryWatermark {
|
|
log.RatedDebug(5, "skip force sync because memory level is not high enough",
|
|
zap.Float64("current_total_memory_usage", toMB(float64(total))),
|
|
zap.Float64("current_memory_watermark", toMB(memoryWatermark)),
|
|
zap.Any("channel_memory_usages", channels))
|
|
return
|
|
}
|
|
|
|
sort.Slice(channels, func(i, j int) bool {
|
|
return channels[i].bufferSize > channels[j].bufferSize
|
|
})
|
|
if fg, ok := fm.flowgraphs.Get(channels[0].channel); ok { // sync the first channel with the largest memory usage
|
|
fg.channel.setIsHighMemory(true)
|
|
log.Info("notify flowgraph to sync",
|
|
zap.String("channel", channels[0].channel), zap.Int64("bufferSize", channels[0].bufferSize))
|
|
}*/
|
|
}
|
|
|
|
func (fm *flowgraphManager) Add(ds *dataSyncService) {
|
|
fm.flowgraphs.Insert(ds.vchannelName, ds)
|
|
metrics.DataNodeNumFlowGraphs.WithLabelValues(fmt.Sprint(paramtable.GetNodeID())).Inc()
|
|
}
|
|
|
|
func (fm *flowgraphManager) addAndStartWithEtcdTickler(dn *DataNode, vchan *datapb.VchannelInfo, schema *schemapb.CollectionSchema, tickler *etcdTickler) error {
|
|
log := log.With(zap.String("channel", vchan.GetChannelName()))
|
|
if fm.flowgraphs.Contain(vchan.GetChannelName()) {
|
|
log.Warn("try to add an existed DataSyncService")
|
|
return nil
|
|
}
|
|
|
|
dataSyncService, err := newServiceWithEtcdTickler(context.TODO(), dn, &datapb.ChannelWatchInfo{
|
|
Schema: schema,
|
|
Vchan: vchan,
|
|
}, tickler)
|
|
if err != nil {
|
|
log.Warn("fail to create new DataSyncService", zap.Error(err))
|
|
return err
|
|
}
|
|
dataSyncService.start()
|
|
fm.flowgraphs.Insert(vchan.GetChannelName(), dataSyncService)
|
|
|
|
metrics.DataNodeNumFlowGraphs.WithLabelValues(fmt.Sprint(paramtable.GetNodeID())).Inc()
|
|
return nil
|
|
}
|
|
|
|
func (fm *flowgraphManager) release(vchanName string) {
|
|
if fg, loaded := fm.flowgraphs.Get(vchanName); loaded {
|
|
fg.close()
|
|
fm.flowgraphs.Remove(vchanName)
|
|
|
|
metrics.DataNodeNumFlowGraphs.WithLabelValues(fmt.Sprint(paramtable.GetNodeID())).Dec()
|
|
rateCol.removeFlowGraphChannel(vchanName)
|
|
}
|
|
}
|
|
|
|
func (fm *flowgraphManager) getFlowgraphService(vchan string) (*dataSyncService, bool) {
|
|
return fm.flowgraphs.Get(vchan)
|
|
}
|
|
|
|
func (fm *flowgraphManager) exist(vchan string) bool {
|
|
_, exist := fm.getFlowgraphService(vchan)
|
|
return exist
|
|
}
|
|
|
|
func (fm *flowgraphManager) existWithOpID(vchan string, opID UniqueID) bool {
|
|
ds, exist := fm.getFlowgraphService(vchan)
|
|
return exist && ds.opID == opID
|
|
}
|
|
|
|
// getFlowGraphNum returns number of flow graphs.
|
|
func (fm *flowgraphManager) getFlowGraphNum() int {
|
|
return fm.flowgraphs.Len()
|
|
}
|
|
|
|
func (fm *flowgraphManager) dropAll() {
|
|
log.Info("start drop all flowgraph resources in DataNode")
|
|
fm.flowgraphs.Range(func(key string, value *dataSyncService) bool {
|
|
value.GracefullyClose()
|
|
fm.flowgraphs.GetAndRemove(key)
|
|
|
|
log.Info("successfully dropped flowgraph", zap.String("vChannelName", key))
|
|
return true
|
|
})
|
|
}
|
|
|
|
func (fm *flowgraphManager) collections() []int64 {
|
|
collectionSet := typeutil.UniqueSet{}
|
|
fm.flowgraphs.Range(func(key string, value *dataSyncService) bool {
|
|
collectionSet.Insert(value.metacache.Collection())
|
|
return true
|
|
})
|
|
|
|
return collectionSet.Collect()
|
|
}
|