2021-10-15 17:48:42 +08:00
|
|
|
import pytest
|
2021-10-22 14:37:21 +08:00
|
|
|
import time
|
2021-10-15 17:48:42 +08:00
|
|
|
|
|
|
|
from pymilvus import connections
|
|
|
|
from utils.util_log import test_log as log
|
2021-10-21 20:19:28 +08:00
|
|
|
from base.collection_wrapper import ApiCollectionWrapper
|
|
|
|
from common import common_func as cf
|
|
|
|
from common import common_type as ct
|
2021-10-22 14:37:21 +08:00
|
|
|
from milvus_operator import MilvusOperator
|
|
|
|
from common.milvus_sys import MilvusSys
|
|
|
|
from common.common_type import CaseLabel
|
2021-10-15 17:48:42 +08:00
|
|
|
|
2021-11-12 19:11:12 +08:00
|
|
|
# SIMD configurations exercised by the tests, sorted by the priority order
# of the simd.
#
# | configuration | possible returned SIMD |
# |---------------|------------------------|
# | auto          | avx512 / avx2 / sse4_2 |
# | avx512        | avx512 / avx2 / sse4_2 |
# | avx2          | avx2 / sse4_2          |
# | avx           | sse4_2                 |
# | sse4_2        | sse4_2                 |
supported_simd_types = [
    "avx512",
    "avx2",
    "avx",
    "sse4_2",
]

# Namespace the Milvus releases in this module are installed into and
# uninstalled from.
namespace = 'chaos-testing'
|
|
|
|
|
|
|
|
|
|
|
|
def _install_milvus(simd):
    """Install a Milvus release configured with the given SIMD type.

    Args:
        simd: value written to ``spec.config.common.simdType``; it is also
            embedded in the generated release name with ``_`` replaced by
            ``-``.

    Returns:
        ``(release_name, host, port)`` when the operator reports the release
        as healthy, where ``host`` and ``port`` are the first two
        ``:``-separated parts of the operator's endpoint string (both are
        strings); ``(release_name, None, None)`` otherwise.
    """
    simd_tag = simd.replace('_', '-')
    release_name = f"mil-{simd_tag}-" + cf.gen_digits_by_length(6)
    cus_configs = {
        'spec.components.image': 'harbor.milvus.io/milvus/milvus:master-latest',
        'metadata.namespace': namespace,
        'metadata.name': release_name,
        'spec.config.common.simdType': simd,
    }

    operator = MilvusOperator()
    log.info(f"install milvus with configs: {cus_configs}")
    operator.install(cus_configs)

    healthy = operator.wait_for_healthy(release_name, namespace, timeout=1200)
    log.info(f"milvus healthy: {healthy}")
    if not healthy:
        # The release name is still returned so the caller can uninstall it.
        return release_name, None, None

    endpoint_parts = operator.endpoint(release_name, namespace).split(':')
    log.info(f"milvus endpoint: {endpoint_parts}")
    return release_name, endpoint_parts[0], endpoint_parts[1]
|
2021-10-15 17:48:42 +08:00
|
|
|
|
|
|
|
|
2021-10-22 14:37:21 +08:00
|
|
|
class TestSimdCompatibility:
    """End-to-end checks that Milvus works when deployed with each SIMD type."""

    def teardown_method(self):
        """Uninstall the Milvus release recorded by the test, if any."""
        # The test can fail before `release_name` is assigned (for example when
        # the install helper raises). Skip cleanup in that case instead of
        # masking the real failure with an AttributeError raised in teardown.
        release_name = getattr(self, "release_name", None)
        if release_name is None:
            return
        milvus_op = MilvusOperator()
        milvus_op.uninstall(release_name, namespace)

    @pytest.mark.tags(CaseLabel.L3)
    @pytest.mark.parametrize('simd', supported_simd_types)
    def test_simd_compat_e2e(self, simd):
        """
        steps
        1. [test_milvus_install]: set up milvus with customized simd configured
        2. [test_simd_compat_e2e]: verify milvus is working well
        3. [test_milvus_cleanup]: delete milvus instances in teardown
        """
        log.info(f"start to install milvus with simd {simd}")
        release_name, host, port = _install_milvus(simd)
        # Record the release before anything else so teardown can remove it
        # even when a later step fails.
        self.release_name = release_name
        # presumably gives the freshly installed service time to settle - TODO confirm
        time.sleep(10)
        assert host is not None

        # Verify the alias is registered instead of relying on the return value
        # of connect(), which is not documented to hand back a connection.
        connections.connect("default", host=host, port=port)
        assert connections.has_connection("default")

        mil = MilvusSys(alias="default")
        log.info(f"milvus build version: {mil.build_version}")
        log.info(f"milvus simdType: {mil.simd_type}")
        # NOTE(review): the module-level table of possible returned SIMD types
        # lists fallbacks (e.g. avx -> sse4_2); this exact-match assertion
        # presumes no fallback happens - confirm.
        assert str(mil.simd_type).lower() == simd.lower()

        log.info(f"start to e2e verification: {simd}")
        # create
        prefix = "simd_"
        name = cf.gen_unique_str(prefix)
        t0 = time.time()
        collection_w = ApiCollectionWrapper()
        collection_w.init_collection_wrap(name=name)
        tt = time.time() - t0
        assert collection_w.name == name
        entities = collection_w.num_entities
        log.info(f"assert create collection: {tt}, init_entities: {entities}")

        # insert: several batches; keep a running total so the flush check
        # below accounts for every batch, not only the last one
        inserted = 0
        for _ in range(10):
            data = cf.gen_default_list_data(nb=300)
            t0 = time.time()
            _, res = collection_w.insert(data)
            tt = time.time() - t0
            log.info(f"assert insert: {tt}")
            assert res
            inserted += len(data[0])

        # flush
        t0 = time.time()
        _, check_result = collection_w.flush(timeout=180)
        assert check_result
        assert collection_w.num_entities == inserted + entities
        tt = time.time() - t0
        entities = collection_w.num_entities
        log.info(f"assert flush: {tt}, entities: {entities}")

        # index: one on the float vector field, one on the string field
        index_params = {"index_type": "IVF_SQ8", "params": {"nlist": 64}, "metric_type": "L2"}
        t0 = time.time()
        collection_w.create_index(field_name=ct.default_float_vec_field_name,
                                  index_params=index_params,
                                  index_name=cf.gen_unique_str())
        collection_w.create_index(field_name=ct.default_string_field_name,
                                  index_params={},
                                  index_name=cf.gen_unique_str())
        tt = time.time() - t0
        log.info(f"assert index: {tt}")
        assert len(collection_w.indexes) == 2

        # load
        collection_w.load()

        # search with a single query vector
        search_vectors = cf.gen_vectors(1, ct.default_dim)
        search_params = {"metric_type": "L2", "params": {"nprobe": 16}}
        t0 = time.time()
        res_1, _ = collection_w.search(data=search_vectors,
                                       anns_field=ct.default_float_vec_field_name,
                                       param=search_params, limit=1)
        tt = time.time() - t0
        log.info(f"assert search: {tt}")
        assert len(res_1) == 1

        # release
        collection_w.release()

        # insert one more batch while the collection is released
        d = cf.gen_default_list_data()
        collection_w.insert(d)

        # load again, then search with several query vectors
        t0 = time.time()
        collection_w.load()
        tt = time.time() - t0
        log.info(f"assert load: {tt}")
        nq = 5
        topk = 5
        search_vectors = cf.gen_vectors(nq, ct.default_dim)
        t0 = time.time()
        res, _ = collection_w.search(data=search_vectors,
                                     anns_field=ct.default_float_vec_field_name,
                                     param=search_params, limit=topk)
        tt = time.time() - t0
        log.info(f"assert search: {tt}")
        assert len(res) == nq
        assert len(res[0]) <= topk

        # query
        term_expr = f'{ct.default_int64_field_name} in [1, 2, 3, 4]'
        t0 = time.time()
        res, _ = collection_w.query(term_expr)
        tt = time.time() - t0
        log.info(f"assert query result {len(res)}: {tt}")
        assert len(res) >= 4
|
|
|
|
|