import asyncio
import random
from actian_vectorai import AsyncVectorAIClient, VectorParams, Distance, PointStruct, distribution_based_score_fusion
COLLECTION = "documents"
DIMENSION = 128
async def main():
async with AsyncVectorAIClient("localhost:50051") as client:
# Create collection if it doesn't exist
if not await client.collections.exists(COLLECTION):
await client.collections.create(
COLLECTION,
vectors_config=VectorParams(size=DIMENSION, distance=Distance.Cosine)
)
# Insert sample points
points = [
PointStruct(
id=i,
vector=[random.gauss(0, 1) for _ in range(DIMENSION)],
payload={
"text": f"Document {i} about {['AI', 'ML', 'NLP', 'CV'][i % 4]}",
"title": f"Article {i}"
}
)
for i in range(1, 101)
]
await client.points.upsert(COLLECTION, points)
print(f"✓ Inserted {len(points)} points")
# Multiple search queries with different characteristics
semantic_query = [random.gauss(0, 1) for _ in range(DIMENSION)]
keyword_query = [random.gauss(0.5, 0.8) for _ in range(DIMENSION)]
# Perform searches
semantic_results = await client.points.search(
COLLECTION,
vector=semantic_query,
limit=20
)
keyword_results = await client.points.search(
COLLECTION,
vector=keyword_query,
limit=20
)
# Fuse with weights (semantic search weighted higher)
print("DBSF fusion")
fused_results = distribution_based_score_fusion(
[semantic_results, keyword_results],
limit=10
)
for i, point in enumerate(fused_results[:5], 1):
print(f"{i}. ID: {point.id}, Fused Score: {point.score:.4f}")
if point.payload:
print(f" Title: {point.payload.get('title', 'N/A')}")
asyncio.run(main())