mirror of
https://gitee.com/milvus-io/milvus.git
synced 2024-12-05 05:18:52 +08:00
f4c643f1bd
Signed-off-by: sunby <bingyi.sun@zilliz.com>
853 lines
21 KiB
Go
853 lines
21 KiB
Go
package querynode
|
|
|
|
import (
|
|
"context"
|
|
"encoding/binary"
|
|
"log"
|
|
"math"
|
|
"testing"
|
|
|
|
"github.com/golang/protobuf/proto"
|
|
"github.com/stretchr/testify/assert"
|
|
|
|
"github.com/zilliztech/milvus-distributed/internal/msgstream"
|
|
"github.com/zilliztech/milvus-distributed/internal/proto/commonpb"
|
|
"github.com/zilliztech/milvus-distributed/internal/proto/etcdpb"
|
|
"github.com/zilliztech/milvus-distributed/internal/proto/schemapb"
|
|
"github.com/zilliztech/milvus-distributed/internal/proto/servicepb"
|
|
)
|
|
|
|
//-------------------------------------------------------------------------------------- constructor and destructor
|
|
func TestSegment_newSegment(t *testing.T) {
|
|
fieldVec := schemapb.FieldSchema{
|
|
Name: "vec",
|
|
DataType: schemapb.DataType_VECTOR_FLOAT,
|
|
TypeParams: []*commonpb.KeyValuePair{
|
|
{
|
|
Key: "dim",
|
|
Value: "16",
|
|
},
|
|
},
|
|
}
|
|
|
|
fieldInt := schemapb.FieldSchema{
|
|
Name: "age",
|
|
DataType: schemapb.DataType_INT32,
|
|
TypeParams: []*commonpb.KeyValuePair{
|
|
{
|
|
Key: "dim",
|
|
Value: "1",
|
|
},
|
|
},
|
|
}
|
|
|
|
schema := schemapb.CollectionSchema{
|
|
Name: "collection0",
|
|
Fields: []*schemapb.FieldSchema{
|
|
&fieldVec, &fieldInt,
|
|
},
|
|
}
|
|
|
|
collectionMeta := etcdpb.CollectionMeta{
|
|
ID: UniqueID(0),
|
|
Schema: &schema,
|
|
CreateTime: Timestamp(0),
|
|
SegmentIDs: []UniqueID{0},
|
|
PartitionTags: []string{"default"},
|
|
}
|
|
|
|
collectionMetaBlob := proto.MarshalTextString(&collectionMeta)
|
|
assert.NotEqual(t, "", collectionMetaBlob)
|
|
|
|
collection := newCollection(&collectionMeta, collectionMetaBlob)
|
|
assert.Equal(t, collection.meta.Schema.Name, "collection0")
|
|
assert.Equal(t, collection.meta.ID, UniqueID(0))
|
|
|
|
segmentID := UniqueID(0)
|
|
segment := newSegment(collection, segmentID)
|
|
assert.Equal(t, segmentID, segment.segmentID)
|
|
deleteSegment(segment)
|
|
deleteCollection(collection)
|
|
}
|
|
|
|
func TestSegment_deleteSegment(t *testing.T) {
|
|
fieldVec := schemapb.FieldSchema{
|
|
Name: "vec",
|
|
DataType: schemapb.DataType_VECTOR_FLOAT,
|
|
TypeParams: []*commonpb.KeyValuePair{
|
|
{
|
|
Key: "dim",
|
|
Value: "16",
|
|
},
|
|
},
|
|
}
|
|
|
|
fieldInt := schemapb.FieldSchema{
|
|
Name: "age",
|
|
DataType: schemapb.DataType_INT32,
|
|
TypeParams: []*commonpb.KeyValuePair{
|
|
{
|
|
Key: "dim",
|
|
Value: "1",
|
|
},
|
|
},
|
|
}
|
|
|
|
schema := schemapb.CollectionSchema{
|
|
Name: "collection0",
|
|
Fields: []*schemapb.FieldSchema{
|
|
&fieldVec, &fieldInt,
|
|
},
|
|
}
|
|
|
|
collectionMeta := etcdpb.CollectionMeta{
|
|
ID: UniqueID(0),
|
|
Schema: &schema,
|
|
CreateTime: Timestamp(0),
|
|
SegmentIDs: []UniqueID{0},
|
|
PartitionTags: []string{"default"},
|
|
}
|
|
|
|
collectionMetaBlob := proto.MarshalTextString(&collectionMeta)
|
|
assert.NotEqual(t, "", collectionMetaBlob)
|
|
|
|
collection := newCollection(&collectionMeta, collectionMetaBlob)
|
|
assert.Equal(t, collection.meta.Schema.Name, "collection0")
|
|
assert.Equal(t, collection.meta.ID, UniqueID(0))
|
|
|
|
segmentID := UniqueID(0)
|
|
segment := newSegment(collection, segmentID)
|
|
assert.Equal(t, segmentID, segment.segmentID)
|
|
|
|
deleteSegment(segment)
|
|
deleteCollection(collection)
|
|
}
|
|
|
|
//-------------------------------------------------------------------------------------- stats functions
|
|
func TestSegment_getRowCount(t *testing.T) {
|
|
fieldVec := schemapb.FieldSchema{
|
|
Name: "vec",
|
|
DataType: schemapb.DataType_VECTOR_FLOAT,
|
|
TypeParams: []*commonpb.KeyValuePair{
|
|
{
|
|
Key: "dim",
|
|
Value: "16",
|
|
},
|
|
},
|
|
}
|
|
|
|
fieldInt := schemapb.FieldSchema{
|
|
Name: "age",
|
|
DataType: schemapb.DataType_INT32,
|
|
TypeParams: []*commonpb.KeyValuePair{
|
|
{
|
|
Key: "dim",
|
|
Value: "1",
|
|
},
|
|
},
|
|
}
|
|
|
|
schema := schemapb.CollectionSchema{
|
|
Name: "collection0",
|
|
Fields: []*schemapb.FieldSchema{
|
|
&fieldVec, &fieldInt,
|
|
},
|
|
}
|
|
|
|
collectionMeta := etcdpb.CollectionMeta{
|
|
ID: UniqueID(0),
|
|
Schema: &schema,
|
|
CreateTime: Timestamp(0),
|
|
SegmentIDs: []UniqueID{0},
|
|
PartitionTags: []string{"default"},
|
|
}
|
|
|
|
collectionMetaBlob := proto.MarshalTextString(&collectionMeta)
|
|
assert.NotEqual(t, "", collectionMetaBlob)
|
|
|
|
collection := newCollection(&collectionMeta, collectionMetaBlob)
|
|
assert.Equal(t, collection.meta.Schema.Name, "collection0")
|
|
assert.Equal(t, collection.meta.ID, UniqueID(0))
|
|
|
|
segmentID := UniqueID(0)
|
|
segment := newSegment(collection, segmentID)
|
|
assert.Equal(t, segmentID, segment.segmentID)
|
|
|
|
ids := []int64{1, 2, 3}
|
|
timestamps := []uint64{0, 0, 0}
|
|
|
|
const DIM = 16
|
|
const N = 3
|
|
var vec = [DIM]float32{1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16}
|
|
var rawData []byte
|
|
for _, ele := range vec {
|
|
buf := make([]byte, 4)
|
|
binary.LittleEndian.PutUint32(buf, math.Float32bits(ele))
|
|
rawData = append(rawData, buf...)
|
|
}
|
|
bs := make([]byte, 4)
|
|
binary.LittleEndian.PutUint32(bs, 1)
|
|
rawData = append(rawData, bs...)
|
|
var records []*commonpb.Blob
|
|
for i := 0; i < N; i++ {
|
|
blob := &commonpb.Blob{
|
|
Value: rawData,
|
|
}
|
|
records = append(records, blob)
|
|
}
|
|
|
|
var offset = segment.segmentPreInsert(N)
|
|
assert.GreaterOrEqual(t, offset, int64(0))
|
|
|
|
err := segment.segmentInsert(offset, &ids, ×tamps, &records)
|
|
assert.NoError(t, err)
|
|
|
|
rowCount := segment.getRowCount()
|
|
assert.Equal(t, int64(N), rowCount)
|
|
|
|
deleteSegment(segment)
|
|
deleteCollection(collection)
|
|
}
|
|
|
|
func TestSegment_getDeletedCount(t *testing.T) {
|
|
fieldVec := schemapb.FieldSchema{
|
|
Name: "vec",
|
|
DataType: schemapb.DataType_VECTOR_FLOAT,
|
|
TypeParams: []*commonpb.KeyValuePair{
|
|
{
|
|
Key: "dim",
|
|
Value: "16",
|
|
},
|
|
},
|
|
}
|
|
|
|
fieldInt := schemapb.FieldSchema{
|
|
Name: "age",
|
|
DataType: schemapb.DataType_INT32,
|
|
TypeParams: []*commonpb.KeyValuePair{
|
|
{
|
|
Key: "dim",
|
|
Value: "1",
|
|
},
|
|
},
|
|
}
|
|
|
|
schema := schemapb.CollectionSchema{
|
|
Name: "collection0",
|
|
Fields: []*schemapb.FieldSchema{
|
|
&fieldVec, &fieldInt,
|
|
},
|
|
}
|
|
|
|
collectionMeta := etcdpb.CollectionMeta{
|
|
ID: UniqueID(0),
|
|
Schema: &schema,
|
|
CreateTime: Timestamp(0),
|
|
SegmentIDs: []UniqueID{0},
|
|
PartitionTags: []string{"default"},
|
|
}
|
|
|
|
collectionMetaBlob := proto.MarshalTextString(&collectionMeta)
|
|
assert.NotEqual(t, "", collectionMetaBlob)
|
|
|
|
collection := newCollection(&collectionMeta, collectionMetaBlob)
|
|
assert.Equal(t, collection.meta.Schema.Name, "collection0")
|
|
assert.Equal(t, collection.meta.ID, UniqueID(0))
|
|
|
|
segmentID := UniqueID(0)
|
|
segment := newSegment(collection, segmentID)
|
|
assert.Equal(t, segmentID, segment.segmentID)
|
|
|
|
ids := []int64{1, 2, 3}
|
|
timestamps := []uint64{0, 0, 0}
|
|
|
|
const DIM = 16
|
|
const N = 3
|
|
var vec = [DIM]float32{1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16}
|
|
var rawData []byte
|
|
for _, ele := range vec {
|
|
buf := make([]byte, 4)
|
|
binary.LittleEndian.PutUint32(buf, math.Float32bits(ele))
|
|
rawData = append(rawData, buf...)
|
|
}
|
|
bs := make([]byte, 4)
|
|
binary.LittleEndian.PutUint32(bs, 1)
|
|
rawData = append(rawData, bs...)
|
|
var records []*commonpb.Blob
|
|
for i := 0; i < N; i++ {
|
|
blob := &commonpb.Blob{
|
|
Value: rawData,
|
|
}
|
|
records = append(records, blob)
|
|
}
|
|
|
|
var offsetInsert = segment.segmentPreInsert(N)
|
|
assert.GreaterOrEqual(t, offsetInsert, int64(0))
|
|
|
|
var err = segment.segmentInsert(offsetInsert, &ids, ×tamps, &records)
|
|
assert.NoError(t, err)
|
|
|
|
var offsetDelete = segment.segmentPreDelete(10)
|
|
assert.GreaterOrEqual(t, offsetDelete, int64(0))
|
|
|
|
err = segment.segmentDelete(offsetDelete, &ids, ×tamps)
|
|
assert.NoError(t, err)
|
|
|
|
var deletedCount = segment.getDeletedCount()
|
|
// TODO: assert.Equal(t, deletedCount, len(ids))
|
|
assert.Equal(t, deletedCount, int64(0))
|
|
|
|
deleteCollection(collection)
|
|
}
|
|
|
|
func TestSegment_getMemSize(t *testing.T) {
|
|
fieldVec := schemapb.FieldSchema{
|
|
Name: "vec",
|
|
DataType: schemapb.DataType_VECTOR_FLOAT,
|
|
TypeParams: []*commonpb.KeyValuePair{
|
|
{
|
|
Key: "dim",
|
|
Value: "16",
|
|
},
|
|
},
|
|
}
|
|
|
|
fieldInt := schemapb.FieldSchema{
|
|
Name: "age",
|
|
DataType: schemapb.DataType_INT32,
|
|
TypeParams: []*commonpb.KeyValuePair{
|
|
{
|
|
Key: "dim",
|
|
Value: "1",
|
|
},
|
|
},
|
|
}
|
|
|
|
schema := schemapb.CollectionSchema{
|
|
Name: "collection0",
|
|
Fields: []*schemapb.FieldSchema{
|
|
&fieldVec, &fieldInt,
|
|
},
|
|
}
|
|
|
|
collectionMeta := etcdpb.CollectionMeta{
|
|
ID: UniqueID(0),
|
|
Schema: &schema,
|
|
CreateTime: Timestamp(0),
|
|
SegmentIDs: []UniqueID{0},
|
|
PartitionTags: []string{"default"},
|
|
}
|
|
|
|
collectionMetaBlob := proto.MarshalTextString(&collectionMeta)
|
|
assert.NotEqual(t, "", collectionMetaBlob)
|
|
|
|
collection := newCollection(&collectionMeta, collectionMetaBlob)
|
|
assert.Equal(t, collection.meta.Schema.Name, "collection0")
|
|
assert.Equal(t, collection.meta.ID, UniqueID(0))
|
|
|
|
segmentID := UniqueID(0)
|
|
segment := newSegment(collection, segmentID)
|
|
assert.Equal(t, segmentID, segment.segmentID)
|
|
|
|
ids := []int64{1, 2, 3}
|
|
timestamps := []uint64{0, 0, 0}
|
|
|
|
const DIM = 16
|
|
const N = 3
|
|
var vec = [DIM]float32{1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16}
|
|
var rawData []byte
|
|
for _, ele := range vec {
|
|
buf := make([]byte, 4)
|
|
binary.LittleEndian.PutUint32(buf, math.Float32bits(ele))
|
|
rawData = append(rawData, buf...)
|
|
}
|
|
bs := make([]byte, 4)
|
|
binary.LittleEndian.PutUint32(bs, 1)
|
|
rawData = append(rawData, bs...)
|
|
var records []*commonpb.Blob
|
|
for i := 0; i < N; i++ {
|
|
blob := &commonpb.Blob{
|
|
Value: rawData,
|
|
}
|
|
records = append(records, blob)
|
|
}
|
|
|
|
var offset = segment.segmentPreInsert(N)
|
|
assert.GreaterOrEqual(t, offset, int64(0))
|
|
|
|
err := segment.segmentInsert(offset, &ids, ×tamps, &records)
|
|
assert.NoError(t, err)
|
|
|
|
var memSize = segment.getMemSize()
|
|
assert.Equal(t, memSize, int64(2785280))
|
|
|
|
deleteSegment(segment)
|
|
deleteCollection(collection)
|
|
}
|
|
|
|
//-------------------------------------------------------------------------------------- dm & search functions
|
|
func TestSegment_segmentInsert(t *testing.T) {
|
|
fieldVec := schemapb.FieldSchema{
|
|
Name: "vec",
|
|
DataType: schemapb.DataType_VECTOR_FLOAT,
|
|
TypeParams: []*commonpb.KeyValuePair{
|
|
{
|
|
Key: "dim",
|
|
Value: "16",
|
|
},
|
|
},
|
|
}
|
|
|
|
fieldInt := schemapb.FieldSchema{
|
|
Name: "age",
|
|
DataType: schemapb.DataType_INT32,
|
|
TypeParams: []*commonpb.KeyValuePair{
|
|
{
|
|
Key: "dim",
|
|
Value: "1",
|
|
},
|
|
},
|
|
}
|
|
|
|
schema := schemapb.CollectionSchema{
|
|
Name: "collection0",
|
|
Fields: []*schemapb.FieldSchema{
|
|
&fieldVec, &fieldInt,
|
|
},
|
|
}
|
|
|
|
collectionMeta := etcdpb.CollectionMeta{
|
|
ID: UniqueID(0),
|
|
Schema: &schema,
|
|
CreateTime: Timestamp(0),
|
|
SegmentIDs: []UniqueID{0},
|
|
PartitionTags: []string{"default"},
|
|
}
|
|
|
|
collectionMetaBlob := proto.MarshalTextString(&collectionMeta)
|
|
assert.NotEqual(t, "", collectionMetaBlob)
|
|
|
|
collection := newCollection(&collectionMeta, collectionMetaBlob)
|
|
assert.Equal(t, collection.meta.Schema.Name, "collection0")
|
|
assert.Equal(t, collection.meta.ID, UniqueID(0))
|
|
|
|
segmentID := UniqueID(0)
|
|
segment := newSegment(collection, segmentID)
|
|
assert.Equal(t, segmentID, segment.segmentID)
|
|
|
|
ids := []int64{1, 2, 3}
|
|
timestamps := []uint64{0, 0, 0}
|
|
|
|
const DIM = 16
|
|
const N = 3
|
|
var vec = [DIM]float32{1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16}
|
|
var rawData []byte
|
|
for _, ele := range vec {
|
|
buf := make([]byte, 4)
|
|
binary.LittleEndian.PutUint32(buf, math.Float32bits(ele))
|
|
rawData = append(rawData, buf...)
|
|
}
|
|
bs := make([]byte, 4)
|
|
binary.LittleEndian.PutUint32(bs, 1)
|
|
rawData = append(rawData, bs...)
|
|
var records []*commonpb.Blob
|
|
for i := 0; i < N; i++ {
|
|
blob := &commonpb.Blob{
|
|
Value: rawData,
|
|
}
|
|
records = append(records, blob)
|
|
}
|
|
|
|
var offset = segment.segmentPreInsert(N)
|
|
assert.GreaterOrEqual(t, offset, int64(0))
|
|
|
|
err := segment.segmentInsert(offset, &ids, ×tamps, &records)
|
|
assert.NoError(t, err)
|
|
deleteSegment(segment)
|
|
deleteCollection(collection)
|
|
}
|
|
|
|
func TestSegment_segmentDelete(t *testing.T) {
|
|
fieldVec := schemapb.FieldSchema{
|
|
Name: "vec",
|
|
DataType: schemapb.DataType_VECTOR_FLOAT,
|
|
TypeParams: []*commonpb.KeyValuePair{
|
|
{
|
|
Key: "dim",
|
|
Value: "16",
|
|
},
|
|
},
|
|
}
|
|
|
|
fieldInt := schemapb.FieldSchema{
|
|
Name: "age",
|
|
DataType: schemapb.DataType_INT32,
|
|
TypeParams: []*commonpb.KeyValuePair{
|
|
{
|
|
Key: "dim",
|
|
Value: "1",
|
|
},
|
|
},
|
|
}
|
|
|
|
schema := schemapb.CollectionSchema{
|
|
Name: "collection0",
|
|
Fields: []*schemapb.FieldSchema{
|
|
&fieldVec, &fieldInt,
|
|
},
|
|
}
|
|
|
|
collectionMeta := etcdpb.CollectionMeta{
|
|
ID: UniqueID(0),
|
|
Schema: &schema,
|
|
CreateTime: Timestamp(0),
|
|
SegmentIDs: []UniqueID{0},
|
|
PartitionTags: []string{"default"},
|
|
}
|
|
|
|
collectionMetaBlob := proto.MarshalTextString(&collectionMeta)
|
|
assert.NotEqual(t, "", collectionMetaBlob)
|
|
|
|
collection := newCollection(&collectionMeta, collectionMetaBlob)
|
|
assert.Equal(t, collection.meta.Schema.Name, "collection0")
|
|
assert.Equal(t, collection.meta.ID, UniqueID(0))
|
|
|
|
segmentID := UniqueID(0)
|
|
segment := newSegment(collection, segmentID)
|
|
assert.Equal(t, segmentID, segment.segmentID)
|
|
|
|
ids := []int64{1, 2, 3}
|
|
timestamps := []uint64{0, 0, 0}
|
|
|
|
const DIM = 16
|
|
const N = 3
|
|
var vec = [DIM]float32{1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16}
|
|
var rawData []byte
|
|
for _, ele := range vec {
|
|
buf := make([]byte, 4)
|
|
binary.LittleEndian.PutUint32(buf, math.Float32bits(ele))
|
|
rawData = append(rawData, buf...)
|
|
}
|
|
bs := make([]byte, 4)
|
|
binary.LittleEndian.PutUint32(bs, 1)
|
|
rawData = append(rawData, bs...)
|
|
var records []*commonpb.Blob
|
|
for i := 0; i < N; i++ {
|
|
blob := &commonpb.Blob{
|
|
Value: rawData,
|
|
}
|
|
records = append(records, blob)
|
|
}
|
|
|
|
var offsetInsert = segment.segmentPreInsert(N)
|
|
assert.GreaterOrEqual(t, offsetInsert, int64(0))
|
|
|
|
var err = segment.segmentInsert(offsetInsert, &ids, ×tamps, &records)
|
|
assert.NoError(t, err)
|
|
|
|
var offsetDelete = segment.segmentPreDelete(10)
|
|
assert.GreaterOrEqual(t, offsetDelete, int64(0))
|
|
|
|
err = segment.segmentDelete(offsetDelete, &ids, ×tamps)
|
|
assert.NoError(t, err)
|
|
|
|
deleteCollection(collection)
|
|
}
|
|
|
|
func TestSegment_segmentSearch(t *testing.T) {
|
|
ctx, cancel := context.WithCancel(context.Background())
|
|
defer cancel()
|
|
|
|
fieldVec := schemapb.FieldSchema{
|
|
Name: "vec",
|
|
DataType: schemapb.DataType_VECTOR_FLOAT,
|
|
TypeParams: []*commonpb.KeyValuePair{
|
|
{
|
|
Key: "dim",
|
|
Value: "16",
|
|
},
|
|
},
|
|
}
|
|
|
|
fieldInt := schemapb.FieldSchema{
|
|
Name: "age",
|
|
DataType: schemapb.DataType_INT32,
|
|
TypeParams: []*commonpb.KeyValuePair{
|
|
{
|
|
Key: "dim",
|
|
Value: "1",
|
|
},
|
|
},
|
|
}
|
|
|
|
schema := schemapb.CollectionSchema{
|
|
Name: "collection0",
|
|
Fields: []*schemapb.FieldSchema{
|
|
&fieldVec, &fieldInt,
|
|
},
|
|
}
|
|
|
|
collectionMeta := etcdpb.CollectionMeta{
|
|
ID: UniqueID(0),
|
|
Schema: &schema,
|
|
CreateTime: Timestamp(0),
|
|
SegmentIDs: []UniqueID{0},
|
|
PartitionTags: []string{"default"},
|
|
}
|
|
|
|
collectionMetaBlob := proto.MarshalTextString(&collectionMeta)
|
|
assert.NotEqual(t, "", collectionMetaBlob)
|
|
|
|
collection := newCollection(&collectionMeta, collectionMetaBlob)
|
|
assert.Equal(t, collection.meta.Schema.Name, "collection0")
|
|
assert.Equal(t, collection.meta.ID, UniqueID(0))
|
|
|
|
segmentID := UniqueID(0)
|
|
segment := newSegment(collection, segmentID)
|
|
assert.Equal(t, segmentID, segment.segmentID)
|
|
|
|
ids := []int64{1, 2, 3}
|
|
timestamps := []uint64{0, 0, 0}
|
|
|
|
const DIM = 16
|
|
const N = 3
|
|
var vec = [DIM]float32{1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16}
|
|
var rawData []byte
|
|
for _, ele := range vec {
|
|
buf := make([]byte, 4)
|
|
binary.LittleEndian.PutUint32(buf, math.Float32bits(ele))
|
|
rawData = append(rawData, buf...)
|
|
}
|
|
bs := make([]byte, 4)
|
|
binary.LittleEndian.PutUint32(bs, 1)
|
|
rawData = append(rawData, bs...)
|
|
var records []*commonpb.Blob
|
|
for i := 0; i < N; i++ {
|
|
blob := &commonpb.Blob{
|
|
Value: rawData,
|
|
}
|
|
records = append(records, blob)
|
|
}
|
|
|
|
var offset = segment.segmentPreInsert(N)
|
|
assert.GreaterOrEqual(t, offset, int64(0))
|
|
|
|
err := segment.segmentInsert(offset, &ids, ×tamps, &records)
|
|
assert.NoError(t, err)
|
|
|
|
dslString := "{\"bool\": { \n\"vector\": {\n \"vec\": {\n \"metric_type\": \"L2\", \n \"params\": {\n \"nprobe\": 10 \n},\n \"query\": \"$0\",\"topk\": 10 \n } \n } \n } \n }"
|
|
|
|
pulsarURL, _ := Params.pulsarAddress()
|
|
const receiveBufSize = 1024
|
|
searchProducerChannels := Params.searchChannelNames()
|
|
searchStream := msgstream.NewPulsarMsgStream(ctx, receiveBufSize)
|
|
searchStream.SetPulsarClient(pulsarURL)
|
|
searchStream.CreatePulsarProducers(searchProducerChannels)
|
|
|
|
var searchRawData []byte
|
|
for _, ele := range vec {
|
|
buf := make([]byte, 4)
|
|
binary.LittleEndian.PutUint32(buf, math.Float32bits(ele))
|
|
searchRawData = append(searchRawData, buf...)
|
|
}
|
|
placeholderValue := servicepb.PlaceholderValue{
|
|
Tag: "$0",
|
|
Type: servicepb.PlaceholderType_VECTOR_FLOAT,
|
|
Values: [][]byte{searchRawData},
|
|
}
|
|
|
|
placeholderGroup := servicepb.PlaceholderGroup{
|
|
Placeholders: []*servicepb.PlaceholderValue{&placeholderValue},
|
|
}
|
|
|
|
placeHolderGroupBlob, err := proto.Marshal(&placeholderGroup)
|
|
if err != nil {
|
|
log.Print("marshal placeholderGroup failed")
|
|
}
|
|
|
|
searchTimestamp := Timestamp(1020)
|
|
cPlan := CreatePlan(*collection, dslString)
|
|
topK := cPlan.GetTopK()
|
|
cPlaceholderGroup := ParserPlaceholderGroup(cPlan, placeHolderGroupBlob)
|
|
placeholderGroups := make([]*PlaceholderGroup, 0)
|
|
placeholderGroups = append(placeholderGroups, cPlaceholderGroup)
|
|
|
|
var numQueries int64 = 0
|
|
for _, pg := range placeholderGroups {
|
|
numQueries += pg.GetNumOfQuery()
|
|
}
|
|
resultIds := make([]IntPrimaryKey, topK*numQueries)
|
|
resultDistances := make([]float32, topK*numQueries)
|
|
for i := range resultDistances {
|
|
resultDistances[i] = math.MaxFloat32
|
|
}
|
|
|
|
err = segment.segmentSearch(cPlan, placeholderGroups, []Timestamp{searchTimestamp}, resultIds, resultDistances, numQueries, topK)
|
|
assert.NoError(t, err)
|
|
|
|
deleteSegment(segment)
|
|
deleteCollection(collection)
|
|
}
|
|
|
|
//-------------------------------------------------------------------------------------- preDm functions
|
|
func TestSegment_segmentPreInsert(t *testing.T) {
|
|
fieldVec := schemapb.FieldSchema{
|
|
Name: "vec",
|
|
DataType: schemapb.DataType_VECTOR_FLOAT,
|
|
TypeParams: []*commonpb.KeyValuePair{
|
|
{
|
|
Key: "dim",
|
|
Value: "16",
|
|
},
|
|
},
|
|
}
|
|
|
|
fieldInt := schemapb.FieldSchema{
|
|
Name: "age",
|
|
DataType: schemapb.DataType_INT32,
|
|
TypeParams: []*commonpb.KeyValuePair{
|
|
{
|
|
Key: "dim",
|
|
Value: "1",
|
|
},
|
|
},
|
|
}
|
|
|
|
schema := schemapb.CollectionSchema{
|
|
Name: "collection0",
|
|
Fields: []*schemapb.FieldSchema{
|
|
&fieldVec, &fieldInt,
|
|
},
|
|
}
|
|
|
|
collectionMeta := etcdpb.CollectionMeta{
|
|
ID: UniqueID(0),
|
|
Schema: &schema,
|
|
CreateTime: Timestamp(0),
|
|
SegmentIDs: []UniqueID{0},
|
|
PartitionTags: []string{"default"},
|
|
}
|
|
|
|
collectionMetaBlob := proto.MarshalTextString(&collectionMeta)
|
|
assert.NotEqual(t, "", collectionMetaBlob)
|
|
|
|
collection := newCollection(&collectionMeta, collectionMetaBlob)
|
|
assert.Equal(t, collection.meta.Schema.Name, "collection0")
|
|
assert.Equal(t, collection.meta.ID, UniqueID(0))
|
|
|
|
segmentID := UniqueID(0)
|
|
segment := newSegment(collection, segmentID)
|
|
assert.Equal(t, segmentID, segment.segmentID)
|
|
|
|
const DIM = 16
|
|
const N = 3
|
|
var vec = [DIM]float32{1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16}
|
|
var rawData []byte
|
|
for _, ele := range vec {
|
|
buf := make([]byte, 4)
|
|
binary.LittleEndian.PutUint32(buf, math.Float32bits(ele))
|
|
rawData = append(rawData, buf...)
|
|
}
|
|
bs := make([]byte, 4)
|
|
binary.LittleEndian.PutUint32(bs, 1)
|
|
rawData = append(rawData, bs...)
|
|
var records []*commonpb.Blob
|
|
for i := 0; i < N; i++ {
|
|
blob := &commonpb.Blob{
|
|
Value: rawData,
|
|
}
|
|
records = append(records, blob)
|
|
}
|
|
|
|
var offset = segment.segmentPreInsert(N)
|
|
assert.GreaterOrEqual(t, offset, int64(0))
|
|
|
|
deleteSegment(segment)
|
|
deleteCollection(collection)
|
|
}
|
|
|
|
func TestSegment_segmentPreDelete(t *testing.T) {
|
|
fieldVec := schemapb.FieldSchema{
|
|
Name: "vec",
|
|
DataType: schemapb.DataType_VECTOR_FLOAT,
|
|
TypeParams: []*commonpb.KeyValuePair{
|
|
{
|
|
Key: "dim",
|
|
Value: "16",
|
|
},
|
|
},
|
|
}
|
|
|
|
fieldInt := schemapb.FieldSchema{
|
|
Name: "age",
|
|
DataType: schemapb.DataType_INT32,
|
|
TypeParams: []*commonpb.KeyValuePair{
|
|
{
|
|
Key: "dim",
|
|
Value: "1",
|
|
},
|
|
},
|
|
}
|
|
|
|
schema := schemapb.CollectionSchema{
|
|
Name: "collection0",
|
|
Fields: []*schemapb.FieldSchema{
|
|
&fieldVec, &fieldInt,
|
|
},
|
|
}
|
|
|
|
collectionMeta := etcdpb.CollectionMeta{
|
|
ID: UniqueID(0),
|
|
Schema: &schema,
|
|
CreateTime: Timestamp(0),
|
|
SegmentIDs: []UniqueID{0},
|
|
PartitionTags: []string{"default"},
|
|
}
|
|
|
|
collectionMetaBlob := proto.MarshalTextString(&collectionMeta)
|
|
assert.NotEqual(t, "", collectionMetaBlob)
|
|
|
|
collection := newCollection(&collectionMeta, collectionMetaBlob)
|
|
assert.Equal(t, collection.meta.Schema.Name, "collection0")
|
|
assert.Equal(t, collection.meta.ID, UniqueID(0))
|
|
|
|
segmentID := UniqueID(0)
|
|
segment := newSegment(collection, segmentID)
|
|
assert.Equal(t, segmentID, segment.segmentID)
|
|
|
|
ids := []int64{1, 2, 3}
|
|
timestamps := []uint64{0, 0, 0}
|
|
|
|
const DIM = 16
|
|
const N = 3
|
|
var vec = [DIM]float32{1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16}
|
|
var rawData []byte
|
|
for _, ele := range vec {
|
|
buf := make([]byte, 4)
|
|
binary.LittleEndian.PutUint32(buf, math.Float32bits(ele))
|
|
rawData = append(rawData, buf...)
|
|
}
|
|
bs := make([]byte, 4)
|
|
binary.LittleEndian.PutUint32(bs, 1)
|
|
rawData = append(rawData, bs...)
|
|
var records []*commonpb.Blob
|
|
for i := 0; i < N; i++ {
|
|
blob := &commonpb.Blob{
|
|
Value: rawData,
|
|
}
|
|
records = append(records, blob)
|
|
}
|
|
|
|
var offsetInsert = segment.segmentPreInsert(N)
|
|
assert.GreaterOrEqual(t, offsetInsert, int64(0))
|
|
|
|
var err = segment.segmentInsert(offsetInsert, &ids, ×tamps, &records)
|
|
assert.NoError(t, err)
|
|
|
|
var offsetDelete = segment.segmentPreDelete(10)
|
|
assert.GreaterOrEqual(t, offsetDelete, int64(0))
|
|
|
|
deleteSegment(segment)
|
|
deleteCollection(collection)
|
|
}
|