mirror of
https://gitee.com/milvus-io/milvus.git
synced 2024-12-05 05:18:52 +08:00
dd4dfbcd8d
This PR cherry-picks the following commits related to data codec - Fix data codec writer close. #33818 - Legacy code clean up. #33838 issue: #33813 #33839 pr: #33818 #33838 Signed-off-by: shaoting-huang <shaoting.huang@zilliz.com>
218 lines
5.3 KiB
Go
218 lines
5.3 KiB
Go
// Licensed to the LF AI & Data foundation under one
|
|
// or more contributor license agreements. See the NOTICE file
|
|
// distributed with this work for additional information
|
|
// regarding copyright ownership. The ASF licenses this file
|
|
// to you under the Apache License, Version 2.0 (the
|
|
// "License"); you may not use this file except in compliance
|
|
// with the License. You may obtain a copy of the License at
|
|
//
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
//
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
// See the License for the specific language governing permissions and
|
|
// limitations under the License.
|
|
|
|
package storage
|
|
|
|
import (
|
|
"sync/atomic"
|
|
|
|
"github.com/cockroachdb/errors"
|
|
|
|
"github.com/milvus-io/milvus-proto/go-api/v2/schemapb"
|
|
"github.com/milvus-io/milvus/pkg/common"
|
|
)
|
|
|
|
var (
|
|
// ErrNoMoreRecord is the error that the iterator does not have next record.
|
|
ErrNoMoreRecord = errors.New("no more record")
|
|
// ErrDisposed is the error that the iterator is disposed.
|
|
ErrDisposed = errors.New("iterator is disposed")
|
|
)
|
|
|
|
// Iterator is the iterator interface.
|
|
type Iterator interface {
|
|
// HasNext returns true if the iterator have unread record
|
|
HasNext() bool
|
|
// Next returns the next record
|
|
Next() (interface{}, error)
|
|
// Dispose disposes the iterator
|
|
Dispose()
|
|
}
|
|
|
|
// Value is the return value of Next
|
|
type Value struct {
|
|
ID int64
|
|
PK PrimaryKey
|
|
Timestamp int64
|
|
IsDeleted bool
|
|
Value interface{}
|
|
}
|
|
|
|
// InsertBinlogIterator is the iterator of binlog
|
|
type InsertBinlogIterator struct {
|
|
dispose int32 // 0: false, 1: true
|
|
data *InsertData
|
|
PKfieldID int64
|
|
PkType schemapb.DataType
|
|
pos int
|
|
}
|
|
|
|
// NewInsertBinlogIterator creates a new iterator
|
|
//
|
|
// Deprecated: use storage.NewBinlogDeserializeReader instead
|
|
func NewInsertBinlogIterator(blobs []*Blob, PKfieldID UniqueID, pkType schemapb.DataType) (*InsertBinlogIterator, error) {
|
|
// TODO: load part of file to read records other than loading all content
|
|
reader := NewInsertCodecWithSchema(nil)
|
|
|
|
_, _, serData, err := reader.Deserialize(blobs)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
return &InsertBinlogIterator{data: serData, PKfieldID: PKfieldID, PkType: pkType}, nil
|
|
}
|
|
|
|
// HasNext returns true if the iterator have unread record
|
|
func (itr *InsertBinlogIterator) HasNext() bool {
|
|
return !itr.isDisposed() && itr.hasNext()
|
|
}
|
|
|
|
// Next returns the next record
|
|
func (itr *InsertBinlogIterator) Next() (interface{}, error) {
|
|
if itr.isDisposed() {
|
|
return nil, ErrDisposed
|
|
}
|
|
|
|
if !itr.hasNext() {
|
|
return nil, ErrNoMoreRecord
|
|
}
|
|
|
|
m := make(map[FieldID]interface{})
|
|
for fieldID, fieldData := range itr.data.Data {
|
|
m[fieldID] = fieldData.GetRow(itr.pos)
|
|
}
|
|
pk, err := GenPrimaryKeyByRawData(itr.data.Data[itr.PKfieldID].GetRow(itr.pos), itr.PkType)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
v := &Value{
|
|
ID: itr.data.Data[common.RowIDField].GetRow(itr.pos).(int64),
|
|
Timestamp: itr.data.Data[common.TimeStampField].GetRow(itr.pos).(int64),
|
|
PK: pk,
|
|
IsDeleted: false,
|
|
Value: m,
|
|
}
|
|
itr.pos++
|
|
return v, nil
|
|
}
|
|
|
|
// Dispose disposes the iterator
|
|
func (itr *InsertBinlogIterator) Dispose() {
|
|
atomic.CompareAndSwapInt32(&itr.dispose, 0, 1)
|
|
}
|
|
|
|
func (itr *InsertBinlogIterator) hasNext() bool {
|
|
_, ok := itr.data.Data[common.RowIDField]
|
|
if !ok {
|
|
return false
|
|
}
|
|
return itr.pos < itr.data.Data[common.RowIDField].RowNum()
|
|
}
|
|
|
|
func (itr *InsertBinlogIterator) isDisposed() bool {
|
|
return atomic.LoadInt32(&itr.dispose) == 1
|
|
}
|
|
|
|
// MergeIterator merge iterators.
|
|
type MergeIterator struct {
|
|
disposed int32
|
|
pos int
|
|
iteraotrs []Iterator
|
|
tmpRecords []*Value
|
|
nextRecord *Value
|
|
}
|
|
|
|
// NewMergeIterator return a new MergeIterator.
|
|
func NewMergeIterator(iterators []Iterator) *MergeIterator {
|
|
return &MergeIterator{
|
|
iteraotrs: iterators,
|
|
tmpRecords: make([]*Value, len(iterators)),
|
|
}
|
|
}
|
|
|
|
// HasNext returns true if the iterator have unread record
|
|
func (itr *MergeIterator) HasNext() bool {
|
|
return !itr.isDisposed() && itr.hasNext()
|
|
}
|
|
|
|
// Next returns the next record
|
|
func (itr *MergeIterator) Next() (interface{}, error) {
|
|
if itr.isDisposed() {
|
|
return nil, ErrDisposed
|
|
}
|
|
|
|
if !itr.hasNext() {
|
|
return nil, ErrNoMoreRecord
|
|
}
|
|
|
|
tmpRecord := itr.nextRecord
|
|
itr.nextRecord = nil
|
|
return tmpRecord, nil
|
|
}
|
|
|
|
// Dispose disposes the iterator
|
|
func (itr *MergeIterator) Dispose() {
|
|
if itr.isDisposed() {
|
|
return
|
|
}
|
|
|
|
for _, tmpItr := range itr.iteraotrs {
|
|
if tmpItr != nil {
|
|
tmpItr.Dispose()
|
|
}
|
|
}
|
|
atomic.CompareAndSwapInt32(&itr.disposed, 0, 1)
|
|
}
|
|
|
|
func (itr *MergeIterator) isDisposed() bool {
|
|
return atomic.LoadInt32(&itr.disposed) == 1
|
|
}
|
|
|
|
func (itr *MergeIterator) hasNext() bool {
|
|
if itr.nextRecord != nil {
|
|
return true
|
|
}
|
|
|
|
var minRecord *Value
|
|
var minPos int
|
|
for i, tmpRecord := range itr.tmpRecords {
|
|
if tmpRecord == nil {
|
|
if itr.iteraotrs[i] != nil && itr.iteraotrs[i].HasNext() {
|
|
next, _ := itr.iteraotrs[i].Next()
|
|
itr.tmpRecords[i] = next.(*Value)
|
|
tmpRecord = itr.tmpRecords[i]
|
|
}
|
|
}
|
|
if tmpRecord == nil {
|
|
continue
|
|
}
|
|
if minRecord == nil || tmpRecord.ID < minRecord.ID {
|
|
minRecord = tmpRecord
|
|
minPos = i
|
|
}
|
|
}
|
|
|
|
if minRecord == nil {
|
|
// all iterators have no more records
|
|
return false
|
|
}
|
|
|
|
itr.tmpRecords[minPos] = nil
|
|
itr.nextRecord = minRecord
|
|
return true
|
|
}
|