29 lines
722 B
Python
29 lines
722 B
Python
import pytest
|
|
from ocrag.embedder import Embedder
|
|
|
|
|
|
@pytest.fixture(scope="module")
def embedder():
    """Provide one ``Embedder`` instance shared by the tests in this module."""
    instance = Embedder()
    return instance
|
|
|
|
|
|
def test_embedder_singleton(embedder):
    """Constructing ``Embedder`` again must yield the fixture's very object."""
    # Identity (not equality) is what is being checked here.
    assert embedder is Embedder()
|
|
|
|
|
|
def test_embed_single(embedder):
    """Embed one sentence and check the result's length and element type."""
    embedding = embedder.embed_single("Test sentence")

    # 1024 is the Qwen3-Embedding-0.6B output dimension.
    assert len(embedding) == 1024

    leading_component = embedding[0]
    assert isinstance(leading_component, float)
|
|
|
|
|
|
def test_embed_batch(embedder):
    """Embed two sentences at once and check count, sizes and distinctness."""
    sentences = ["Sentence 1", "Sentence 2"]
    batch = embedder.embed(sentences)

    # One embedding is expected per input sentence.
    assert len(batch) == 2

    first_vector = batch[0]
    second_vector = batch[1]
    assert len(first_vector) == 1024
    assert len(second_vector) == 1024

    # Different sentences should have different embeddings.
    assert first_vector != second_vector
|