# ocrag/tests/unit/test_embedder.py
#
# 29 lines
# 722 B
# Python

import pytest
from ocrag.embedder import Embedder
@pytest.fixture(scope="module")
def embedder():
    """Build one ``Embedder`` and share it across the tests in this module."""
    # scope="module": the fixture body runs once and the result is reused.
    shared_instance = Embedder()
    return shared_instance
def test_embedder_singleton(embedder):
    """Constructing ``Embedder`` again must yield the fixture's own object."""
    another = Embedder()
    # Identity, not equality: both names must refer to the very same instance.
    assert another is embedder
def test_embed_single(embedder):
    """Check the length and element type of a single-sentence embedding."""
    expected_dim = 1024  # Qwen3-Embedding-0.6B output dimension
    embedding = embedder.embed_single("Test sentence")
    assert len(embedding) == expected_dim
    # NOTE(review): requires a builtin-float-compatible element; confirm the
    # return type of embed_single if this ever fails on a NumPy scalar.
    first_component = embedding[0]
    assert isinstance(first_component, float)
def test_embed_batch(embedder):
    """Check that ``embed`` returns one distinct 1024-length vector per input."""
    expected_dim = 1024
    sentences = ["Sentence 1", "Sentence 2"]
    vectors = embedder.embed(sentences)
    assert len(vectors) == 2
    first, second = vectors[0], vectors[1]
    assert len(first) == expected_dim
    assert len(second) == expected_dim
    # Different sentences should have different embeddings.
    # NOTE(review): assumes the vectors compare as plain sequences -- confirm.
    assert first != second