colibri.qdrant / tests /openapi /test_optional_vectors.py
Gouzi Mohaled
Ajout du dossier tests
3932407
import pytest
from .helpers.collection_setup import drop_collection, multivec_collection_setup
from .helpers.helpers import request_with_validation
@pytest.fixture(autouse=True)
def setup(on_disk_vectors, on_disk_payload, collection_name):
multivec_collection_setup(collection_name=collection_name, on_disk_vectors=on_disk_vectors, on_disk_payload=on_disk_payload, distance='Dot')
yield
drop_collection(collection_name=collection_name)
def compare_vectors(v1, v2):
if len(v1) != len(v2):
return False
for i in range(len(v1)):
if abs(v1[i] - v2[i]) > 1e-5:
return False
return True
def test_delete_and_search(collection_name):
response = request_with_validation(
api='/collections/{collection_name}/points/vectors/delete',
method="POST",
path_params={'collection_name': collection_name},
body={
"points": [2, 3],
"vector": ["text"]
}
)
assert response.ok
response = request_with_validation(
api='/collections/{collection_name}/points/search',
method="POST",
path_params={'collection_name': collection_name},
body={
"vector": {
"name": "image",
"vector": [0.0, 0.0, 1.0, 1.0]
},
"limit": 10,
"with_payload": True,
"with_vector": ["text"],
}
)
assert response.ok
def test_retrieve_deleted_vector(collection_name):
# Delete vector
response = request_with_validation(
api='/collections/{collection_name}/points/vectors/delete',
method="POST",
path_params={'collection_name': collection_name},
body={
"points": [1, 3],
"vector": ["text"]
}
)
assert response.ok
# Retrieve deleted vector
response = request_with_validation(
api='/collections/{collection_name}/points',
method="POST",
path_params={'collection_name': collection_name},
body={
"ids": [1, 2, 3, 4],
"with_vectors": ["text", "image"],
"with_payload": True,
}
)
assert response.ok
result = response.json()["result"]
assert len(result) == 4
id_to_result = {r["id"]: r for r in result}
assert id_to_result[1]["vector"].get("image") is not None
assert id_to_result[1]["vector"].get("text") is None
assert id_to_result[2]["vector"].get("image") is not None
assert id_to_result[2]["vector"].get("text") is not None
assert id_to_result[3]["vector"].get("image") is not None
assert id_to_result[3]["vector"].get("text") is None
assert id_to_result[4]["vector"].get("image") is not None
assert id_to_result[4]["vector"].get("text") is not None
def test_upsert_partial_vectors(collection_name):
response = request_with_validation(
api='/collections/{collection_name}/points',
method="PUT",
path_params={'collection_name': collection_name},
query_params={'wait': 'true'},
body={
"points": [
{
"id": 101,
"vector": {
"text": [0.05, 0.61, 0.76, 0.74, 0.05, 0.61, 0.76, 0.74],
},
"payload": {"city": "Berlin"}
},
{
"id": 102,
"vector": {
"image": [0.19, 0.81, 0.75, 0.11],
},
"payload": {"city": ["Berlin", "London"]}
},
{
"id": 103,
"vector": {},
"payload": {"city": ["Berlin", "Moscow"]}
},
]
}
)
assert response.ok
response = request_with_validation(
api='/collections/{collection_name}/points/{id}',
method="GET",
path_params={'collection_name': collection_name, 'id': 101},
)
assert response.ok
result = response.json()["result"]
assert result["id"] == 101
assert "image" not in result["vector"]
assert "text" in result["vector"]
response = request_with_validation(
api='/collections/{collection_name}/points/{id}',
method="GET",
path_params={'collection_name': collection_name, 'id': 102},
)
assert response.ok
result = response.json()["result"]
assert result["id"] == 102
assert "image" in result["vector"]
assert "text" not in result["vector"]
response = request_with_validation(
api='/collections/{collection_name}/points/{id}',
method="GET",
path_params={'collection_name': collection_name, 'id': 103},
)
assert response.ok
result = response.json()["result"]
assert result["id"] == 103
assert "image" not in result["vector"]
assert "text" not in result["vector"]
def test_update_vectors(collection_name):
POINT_ID = 1000
# Put empty vector first
response = request_with_validation(
api='/collections/{collection_name}/points',
method="PUT",
path_params={'collection_name': collection_name},
query_params={'wait': 'true'},
body={
"points": [
{
"id": POINT_ID,
"vector": {},
"payload": {"city": "Berlin"}
}
]
}
)
assert response.ok
response = request_with_validation(
api='/collections/{collection_name}/points/{id}',
method="GET",
path_params={'collection_name': collection_name, 'id': POINT_ID},
)
assert response.ok
result = response.json()["result"]
assert result["vector"].get("text") is None
text_vector = [
0.34035879, 0.344099,
0.3478392, 0.35157941,
0.35531961, 0.35905982,
0.36280003, 0.36654023
]
response = request_with_validation(
api='/collections/{collection_name}/points/vectors',
method="PUT",
path_params={'collection_name': collection_name},
query_params={'wait': 'true'},
body={
"points": [
{
"id": POINT_ID,
"vector": {
"text": text_vector,
}
}
]
}
)
assert response.ok
response = request_with_validation(
api='/collections/{collection_name}/points/{id}',
method="GET",
path_params={'collection_name': collection_name, 'id': POINT_ID},
)
assert response.ok
result = response.json()["result"]
assert compare_vectors(result["vector"]["text"], text_vector)
assert result["payload"]["city"] == "Berlin"
text_vector = [
0.07902951, 0.22391693,
0.36880436, 0.51369179,
0.59272129, 0.07902951,
0.22391693, 0.36880436
]
image_vector = [0.19, 0.28, 0.37, 0.46]
response = request_with_validation(
api='/collections/{collection_name}/points/vectors',
method="PUT",
path_params={'collection_name': collection_name},
query_params={'wait': 'true'},
body={
"points": [
{
"id": POINT_ID,
"vector": {
"text": text_vector,
"image": image_vector,
}
}
]
}
)
assert response.ok
response = request_with_validation(
api='/collections/{collection_name}/points/{id}',
method="GET",
path_params={'collection_name': collection_name, 'id': POINT_ID},
)
assert response.ok
result = response.json()["result"]
assert compare_vectors(result["vector"]["image"], image_vector)
assert compare_vectors(result["vector"]["text"], text_vector)
image_vector = [0.00, 0.01, 0.00, 0.01]
response = request_with_validation(
api='/collections/{collection_name}/points/vectors',
method="PUT",
path_params={'collection_name': collection_name},
query_params={'wait': 'true'},
body={
"points": [
{
"id": POINT_ID,
"vector": {
"image": image_vector,
}
}
]
}
)
assert response.ok
response = request_with_validation(
api='/collections/{collection_name}/points/{id}',
method="GET",
path_params={'collection_name': collection_name, 'id': POINT_ID},
)
assert response.ok
result = response.json()["result"]
assert compare_vectors(result["vector"]["image"], image_vector)
assert compare_vectors(result["vector"]["text"], text_vector)
def test_update_empty_vectors(collection_name):
"""
Remove all named vectors for a point. Then add named vectors and test
against it.
"""
response = request_with_validation(
api='/collections/{collection_name}/points/vectors/delete',
method="POST",
path_params={'collection_name': collection_name},
body={
"points": [1],
"vector": ["image", "text"]
}
)
assert response.ok
response = request_with_validation(
api='/collections/{collection_name}/points/{id}',
method="GET",
path_params={'collection_name': collection_name, 'id': 1},
)
assert response.ok
result = response.json()["result"]
assert "text" not in result["vector"]
assert "image" not in result["vector"]
text_vector = [
0.34035879, 0.344099,
0.3478392, 0.35157941,
0.35531961, 0.35905982,
0.36280003, 0.36654023
]
response = request_with_validation(
api='/collections/{collection_name}/points/vectors',
method="PUT",
path_params={'collection_name': collection_name},
query_params={'wait': 'true'},
body={
"points": [
{
"id": 1,
"vector": {
"text": text_vector,
}
}
]
}
)
assert response.ok
response = request_with_validation(
api='/collections/{collection_name}/points/{id}',
method="GET",
path_params={'collection_name': collection_name, 'id': 1},
)
assert response.ok
result = response.json()["result"]
assert compare_vectors(result["vector"]["text"], text_vector)
assert "image" not in result["vector"]
image_vector = [0.19, 0.28, 0.37, 0.46]
response = request_with_validation(
api='/collections/{collection_name}/points/vectors',
method="PUT",
path_params={'collection_name': collection_name},
query_params={'wait': 'true'},
body={
"points": [
{
"id": 1,
"vector": {
"image": image_vector,
}
}
]
}
)
assert response.ok
response = request_with_validation(
api='/collections/{collection_name}/points/{id}',
method="GET",
path_params={'collection_name': collection_name, 'id': 1},
)
assert response.ok
result = response.json()["result"]
assert compare_vectors(result["vector"]["image"], image_vector)
assert compare_vectors(result["vector"]["text"], text_vector)
def test_update_vectors_unknown_point(collection_name):
response = request_with_validation(
api='/collections/{collection_name}/points/vectors',
method="PUT",
path_params={'collection_name': collection_name},
query_params={'wait': 'true'},
body={
"points": [
{
"id": 1,
"vector": {
"text": [0.05, 0.61, 0.76, 0.74, 0.05, 0.61, 0.76, 0.74],
},
"payload": {"city": "Berlin"}
},
{
"id": 424242424242424242,
"vector": {
"image": [0.19, 0.81, 0.75, 0.11],
},
"payload": {"city": ["Berlin", "London"]}
}
]
}
)
assert not response.ok
assert response.status_code == 404
error = response.json()["status"]["error"]
assert error == "Not found: No point with id 424242424242424242 found"
def test_update_vectors_same_point_in_batch(collection_name):
POINT_ID = 1000
response = request_with_validation(
api='/collections/{collection_name}/points',
method="PUT",
path_params={'collection_name': collection_name},
query_params={'wait': 'true'},
body={
"points": [
{
"id": POINT_ID,
"vector": {
"text": [0.1, 0.3, 0.2, 0.9, 0.9, 0.1, 0.4, 0.9],
"image": [0.8, 0.6, 0.3, 0.0],
},
}
]
}
)
assert response.ok
response = request_with_validation(
api='/collections/{collection_name}/points/{id}',
method="GET",
path_params={'collection_name': collection_name, 'id': POINT_ID},
)
assert response.ok
result = response.json()["result"]
assert result["vector"].get("text") == [0.1, 0.3, 0.2, 0.9, 0.9, 0.1, 0.4, 0.9]
assert result["vector"].get("image") == [0.8, 0.6, 0.3, 0.0]
# Update both vectors in separate batch items
# Matches bug report: <https://github.com/qdrant/qdrant/issues/3376>
response = request_with_validation(
api='/collections/{collection_name}/points/vectors',
method="PUT",
path_params={'collection_name': collection_name},
query_params={'wait': 'true'},
body={
"points": [
{
"id": POINT_ID,
"vector": {
"text": [0.8, 0.8, 0.9, 0.2, 0.7, 0.5, 0.2, 0.6],
}
},
{
"id": POINT_ID,
"vector": {
"image": [0.3, 0.6, 0.4, 0.4],
}
}
]
}
)
assert response.ok
response = request_with_validation(
api='/collections/{collection_name}/points/{id}',
method="GET",
path_params={'collection_name': collection_name, 'id': POINT_ID},
)
assert response.ok
result = response.json()["result"]
assert result["vector"].get("text") == [0.8, 0.8, 0.9, 0.2, 0.7, 0.5, 0.2, 0.6]
assert result["vector"].get("image") == [0.3, 0.6, 0.4, 0.4]
# Update the same vector twice
response = request_with_validation(
api='/collections/{collection_name}/points/vectors',
method="PUT",
path_params={'collection_name': collection_name},
query_params={'wait': 'true'},
body={
"points": [
{
"id": POINT_ID,
"vector": {
"text": [0.2, 0.0, 0.1, 0.3, 0.1, 0.0, 0.0, 0.5],
}
},
{
"id": POINT_ID,
"vector": {
"image": [0.7, 0.5, 0.0, 0.5],
"text": [0.9, 0.2, 0.5, 0.6, 0.4, 0.1, 0.6, 0.7],
}
},
{
"id": 1,
"vector": {
"image": [0.4, 0.4, 0.0, 0.9],
"text": [0.8, 0.6, 0.9, 0.2, 0.3, 0.9, 0.5, 0.9],
}
},
{
"id": 2,
"vector": {
"text": [0.5, 0.8, 0.9, 0.8, 0.3, 0.2, 0.1, 0.1],
}
},
{
"id": 3,
"vector": {
"image": [0.1, 0.1, 0.3, 0.7],
}
},
{
"id": POINT_ID,
"vector": {
"image": [0.9, 0.9, 0.7, 0.5],
}
},
{
"id": POINT_ID,
"vector": {
"image": [0.4, 0.5, 0.6, 0.2],
}
},
]
}
)
assert response.ok
response = request_with_validation(
api='/collections/{collection_name}/points/{id}',
method="GET",
path_params={'collection_name': collection_name, 'id': POINT_ID},
)
assert response.ok
result = response.json()["result"]
assert result["vector"].get("text") == [0.9, 0.2, 0.5, 0.6, 0.4, 0.1, 0.6, 0.7]
assert result["vector"].get("image") == [0.4, 0.5, 0.6, 0.2]
def test_no_vectors(collection_name):
response = request_with_validation(
api='/collections/{collection_name}/points/vectors',
method="PUT",
path_params={'collection_name': collection_name},
query_params={'wait': 'true'},
body={
"points": [
{
"id": 1,
"vector": {},
}
]
}
)
assert not response.ok
assert response.status_code == 422
error = response.json()["status"]["error"]
assert error.__contains__(
"Validation error in JSON body: [points[0].vector: must specify vectors to update for point]")
def test_delete_vectors(collection_name):
delete_vectors(collection_name)
# Deleting a second time should work fine
delete_vectors(collection_name)
def delete_vectors(collection_name):
response = request_with_validation(
api='/collections/{collection_name}/points/vectors/delete',
method="POST",
path_params={'collection_name': collection_name},
body={
"points": [1, 2],
"vector": ["image"]
}
)
assert response.ok
response = request_with_validation(
api='/collections/{collection_name}/points/vectors/delete',
method="POST",
path_params={'collection_name': collection_name},
body={
"points": [2, 3],
"vector": ["text"]
}
)
assert response.ok
response = request_with_validation(
api='/collections/{collection_name}/points/{id}',
method="GET",
path_params={'collection_name': collection_name, 'id': 1},
)
assert response.ok
result = response.json()["result"]
assert "image" not in result["vector"]
assert "text" in result["vector"]
response = request_with_validation(
api='/collections/{collection_name}/points/{id}',
method="GET",
path_params={'collection_name': collection_name, 'id': 2},
)
assert response.ok
result = response.json()["result"]
assert "image" not in result["vector"]
assert "text" not in result["vector"]
response = request_with_validation(
api='/collections/{collection_name}/points/{id}',
method="GET",
path_params={'collection_name': collection_name, 'id': 3},
)
assert response.ok
result = response.json()["result"]
assert "image" in result["vector"]
assert "text" not in result["vector"]
def test_delete_all_vectors(collection_name):
response = request_with_validation(
api='/collections/{collection_name}/points/vectors/delete',
method="POST",
path_params={'collection_name': collection_name},
body={
"filter": {},
"vector": ["image", "text"]
}
)
assert response.ok
def test_delete_unknown_vectors(collection_name):
response = request_with_validation(
api='/collections/{collection_name}/points/vectors/delete',
method="POST",
path_params={'collection_name': collection_name},
query_params={'wait': 'true'},
body={
"points": [1, 2],
"vector": ["a"]
}
)
assert not response.ok
assert response.status_code == 400
error = response.json()["status"]["error"]
assert error.__contains__("Wrong input: Not existing vector name error: a")