mirror of
https://gitee.com/milvus-io/milvus.git
synced 2024-12-04 21:09:06 +08:00
189ac881f3
* Remove redundant session startup Signed-off-by: sunby <bingyi.sun@zilliz.com> * Register datanode after start success Signed-off-by: sunby <bingyi.sun@zilliz.com> * fix meta snap shot Signed-off-by: yefu.chen <yefu.chen@zilliz.com> * fix datanode message stream channel Signed-off-by: yangxuan <xuan.yang@zilliz.com> * Fix bugs when drop empty collection Signed-off-by: sunby <bingyi.sun@zilliz.com> * Fix bug of getting pchan statistics from task scheduler Signed-off-by: dragondriver <jiquan.long@zilliz.com> * Fix i/dist/dataservice test code Signed-off-by: Congqi Xia <congqi.xia@zilliz.com> * Fix epoch lifetime not applied Signed-off-by: Congqi Xia <congqi.xia@zilliz.com> * fix datanode flowgraph dd node Signed-off-by: yangxuan <xuan.yang@zilliz.com> * Fix handle datanode timetick bug Signed-off-by: sunby <bingyi.sun@zilliz.com> * Remove repack function of dml stream Signed-off-by: dragondriver <jiquan.long@zilliz.com> * fix proxynode Signed-off-by: yefu.chen <yefu.chen@zilliz.com> * Apply extended seal policy Signed-off-by: Congqi Xia <congqi.xia@zilliz.com> * add check for time tick Signed-off-by: yefu.chen <yefu.chen@zilliz.com> * fix check Signed-off-by: yefu.chen <yefu.chen@zilliz.com> * Fix the repack function of dml stream Signed-off-by: dragondriver <jiquan.long@zilliz.com> * Fix the bug when send statistics of pchan Signed-off-by: dragondriver <jiquan.long@zilliz.com> * Fix the repack function when craete dml stream Signed-off-by: dragondriver <jiquan.long@zilliz.com> * fix bugs Signed-off-by: yefu.chen <yefu.chen@zilliz.com> * fix describe collection Signed-off-by: yefu.chen <yefu.chen@zilliz.com> * Fix bug when send timestamp statistics Signed-off-by: dragondriver <jiquan.long@zilliz.com> * fix data node Signed-off-by: yefu.chen <yefu.chen@zilliz.com> * Add length check before flush request Signed-off-by: Congqi Xia <congqi.xia@zilliz.com> * add log for data node Signed-off-by: yefu.chen <yefu.chen@zilliz.com> * Fix SaveBinlog bugs Signed-off-by: sunby 
<bingyi.sun@zilliz.com> * Add more log in datanode Signed-off-by: yangxuan <xuan.yang@zilliz.com> * Put SegmentState.Flushing as the last one in enum to fit the client Signed-off-by: sunby <bingyi.sun@zilliz.com> * Fix params in GetInsertBinlogPaths Signed-off-by: sunby <bingyi.sun@zilliz.com> * Rename policy Signed-off-by: sunby <bingyi.sun@zilliz.com> * Remove unused ddl functions and fields Signed-off-by: Congqi Xia <congqi.xia@zilliz.com> * Remove pchan when drop collection Signed-off-by: dragondriver <jiquan.long@zilliz.com> * Add balanced assignment policy Signed-off-by: sunby <bingyi.sun@zilliz.com> * fix master ut Signed-off-by: yefu.chen <yefu.chen@zilliz.com> * Add lock in session manager Signed-off-by: Congqi Xia <congqi.xia@zilliz.com> * add log for debug Signed-off-by: yefu.chen <yefu.chen@zilliz.com> * Fix some logic bug and typo Signed-off-by: Congqi Xia <congqi.xia@zilliz.com> * Fix recover bugs Signed-off-by: sunby <bingyi.sun@zilliz.com> * Get collection scheme of a specific timestamp Signed-off-by: yangxuan <xuan.yang@zilliz.com> * Change CheckPoint to SegmentInfo in VchannelInfo Signed-off-by: sunby <bingyi.sun@zilliz.com> * Recover Unflushed segment numOfRows Signed-off-by: yangxuan <xuan.yang@zilliz.com> * Fix dataservice unit tests Signed-off-by: sunby <bingyi.sun@zilliz.com> Co-authored-by: yefu.chen <yefu.chen@zilliz.com> Co-authored-by: yangxuan <xuan.yang@zilliz.com> Co-authored-by: dragondriver <jiquan.long@zilliz.com> Co-authored-by: Congqi Xia <congqi.xia@zilliz.com>
132 lines
4.0 KiB
Go
132 lines
4.0 KiB
Go
// Copyright (C) 2019-2020 Zilliz. All rights reserved.
|
|
//
|
|
// Licensed under the Apache License, Version 2.0 (the "License"); you may not use this file except in compliance
|
|
// with the License. You may obtain a copy of the License at
|
|
//
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
//
|
|
// Unless required by applicable law or agreed to in writing, software distributed under the License
|
|
// is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express
|
|
// or implied. See the License for the specific language governing permissions and limitations under the License.
|
|
|
|
package dataservice
|
|
|
|
import (
	"fmt"
	"sort"

	"github.com/milvus-io/milvus/internal/proto/schemapb"
	"github.com/milvus-io/milvus/internal/util/typeutil"
)
|
|
|
|
type calUpperLimitPolicy interface {
|
|
// apply accept collection schema and return max number of rows per segment
|
|
apply(schema *schemapb.CollectionSchema) (int, error)
|
|
}
|
|
|
|
type calBySchemaPolicy struct {
|
|
}
|
|
|
|
func (p *calBySchemaPolicy) apply(schema *schemapb.CollectionSchema) (int, error) {
|
|
sizePerRecord, err := typeutil.EstimateSizePerRecord(schema)
|
|
if err != nil {
|
|
return -1, err
|
|
}
|
|
threshold := Params.SegmentSize * 1024 * 1024
|
|
return int(threshold / float64(sizePerRecord)), nil
|
|
}
|
|
|
|
func newCalBySchemaPolicy() calUpperLimitPolicy {
|
|
return &calBySchemaPolicy{}
|
|
}
|
|
|
|
// allocatePolicy decides whether an allocation request may be accepted.
type allocatePolicy interface {
	// apply reports whether a request for count is acceptable given
	// maxCount, writtenCount and allocatedCount.
	apply(maxCount, writtenCount, allocatedCount, count int64) bool
}
|
|
|
|
type allocatePolicyV1 struct {
|
|
}
|
|
|
|
func (p *allocatePolicyV1) apply(maxCount, writtenCount, allocatedCount, count int64) bool {
|
|
free := maxCount - writtenCount - allocatedCount
|
|
return free >= count
|
|
}
|
|
|
|
func newAllocatePolicyV1() allocatePolicy {
|
|
return &allocatePolicyV1{}
|
|
}
|
|
|
|
// sealPolicy decides whether a segment should be sealed based on row counts.
type sealPolicy interface {
	// apply reports the seal decision for the given maxCount, writtenCount
	// and allocatedCount.
	apply(maxCount, writtenCount, allocatedCount int64) bool
}
|
|
|
|
// segmentSealPolicy seal policy applies to segment
|
|
type segmentSealPolicy func(*segmentStatus, Timestamp) bool
|
|
|
|
// channelSealPolicy seal policy applies to channel
|
|
type channelSealPolicy func(string, []*segmentStatus, Timestamp) []*segmentStatus
|
|
|
|
// getSegmentCapacityPolicy get segmentSealPolicy with segment size factor policy
|
|
func getSegmentCapacityPolicy(sizeFactor float64) segmentSealPolicy {
|
|
return func(status *segmentStatus, ts Timestamp) bool {
|
|
var allocSize int64
|
|
for _, allocation := range status.allocations {
|
|
allocSize += allocation.rowNums
|
|
}
|
|
// max, written, allocated := status.total, status.currentRows, allocSize
|
|
// float64(writtenCount) >= Params.SegmentSizeFactor*float64(maxCount)
|
|
return float64(status.currentRows) >= sizeFactor*float64(status.total)
|
|
}
|
|
}
|
|
|
|
// getLastExpiresLifetimePolicy get segmentSealPolicy with lifetime limit compares ts - segment.lastExpireTime
|
|
func getLastExpiresLifetimePolicy(lifetime uint64) segmentSealPolicy {
|
|
return func(status *segmentStatus, ts Timestamp) bool {
|
|
return (ts - status.lastExpireTime) > lifetime
|
|
}
|
|
}
|
|
|
|
// getChannelCapacityPolicy get channelSealPolicy with channel segment capacity policy
|
|
func getChannelOpenSegCapacityPolicy(limit int) channelSealPolicy {
|
|
return func(channel string, segs []*segmentStatus, ts Timestamp) []*segmentStatus {
|
|
if len(segs) <= limit {
|
|
return []*segmentStatus{}
|
|
}
|
|
sortSegStatusByLastExpires(segs)
|
|
offLen := len(segs) - limit
|
|
return segs[0:offLen]
|
|
}
|
|
}
|
|
|
|
// sortSegStatusByLastExpires sort segmentStatus with lastExpireTime ascending order
|
|
func sortSegStatusByLastExpires(segs []*segmentStatus) {
|
|
sort.Slice(segs, func(i, j int) bool {
|
|
return segs[i].lastExpireTime < segs[j].lastExpireTime
|
|
})
|
|
}
|
|
|
|
type sealPolicyV1 struct {
|
|
}
|
|
|
|
func (p *sealPolicyV1) apply(maxCount, writtenCount, allocatedCount int64) bool {
|
|
return float64(writtenCount) >= Params.SegmentSizeFactor*float64(maxCount)
|
|
}
|
|
|
|
func newSealPolicyV1() sealPolicy {
|
|
return &sealPolicyV1{}
|
|
}
|
|
|
|
type flushPolicy interface {
|
|
apply(status *segmentStatus, t Timestamp) bool
|
|
}
|
|
|
|
type flushPolicyV1 struct {
|
|
}
|
|
|
|
func (p *flushPolicyV1) apply(status *segmentStatus, t Timestamp) bool {
|
|
return status.sealed && status.lastExpireTime <= t
|
|
}
|
|
|
|
func newFlushPolicyV1() flushPolicy {
|
|
return &flushPolicyV1{}
|
|
}
|