Skip to content

Commit

Permalink
Modifies tests and workflow to handle optional component.
Browse files Browse the repository at this point in the history
  • Loading branch information
alanmeeson committed Mar 30, 2024
1 parent f31181e commit 3248e36
Show file tree
Hide file tree
Showing 2 changed files with 79 additions and 38 deletions.
8 changes: 4 additions & 4 deletions .github/workflows/test.yml
Original file line number Diff line number Diff line change
Expand Up @@ -23,13 +23,13 @@ jobs:
strategy:
fail-fast: false
matrix:
os: [ubuntu-latest, macos-latest]
os: [ubuntu-latest, macos-latest, windows-latest]
python-version: ['3.9', '3.10']
exclude:
- os: macos-latest
python-version: '3.9'

steps:
- name: Install sqlite-vss on linux
if: matrix.os == 'ubuntu-latest'
run: pip install sqlite-vss
- name: Support longpaths
if: matrix.os == 'windows-latest'
run: git config --system core.longpaths true
Expand Down
109 changes: 75 additions & 34 deletions tests/test_embedding_retriever.py
Original file line number Diff line number Diff line change
@@ -1,44 +1,72 @@
# SPDX-FileCopyrightText: 2024-present Alan Meeson <am@carefullycalculated.co.uk>
#
# SPDX-License-Identifier: Apache-2.0
import pytest
from haystack.dataclasses import Document

from sqlite_haystack.document_store import SQLiteDocumentStore
from sqlite_haystack.embedding_retriever import SQLiteVSSEmbeddingRetriever


# TODO: find a cleaner way to test the optional sqlite-vss dependency, which is not installable on every
# environment (e.g. pytest.importorskip or a shared skipif marker instead of a try/import in each test).

def test_init_default():
    """Check the retriever's default construction, or its disabled-component guard.

    When the optional ``sqlite_vss`` package can be imported, the retriever is
    built with defaults and its stored attributes are checked. When it cannot,
    constructing the retriever is expected to raise ``NotImplementedError``.
    """
    try:
        import sqlite_vss  # noqa: F401  (imported only to probe availability)
    except ImportError:
        vss_available = False
    else:
        vss_available = True

    store = SQLiteDocumentStore(":memory:")

    if not vss_available:
        # The optional component is disabled. pytest.raises needs an exception
        # *class*; the ``NotImplemented`` constant is not one and would make
        # pytest itself fail with a TypeError.
        with pytest.raises(NotImplementedError):
            SQLiteVSSEmbeddingRetriever(document_store=store)
        return

    # sqlite-vss is importable, so exercise the real component.
    retriever = SQLiteVSSEmbeddingRetriever(document_store=store)
    assert retriever._document_store == store
    assert retriever._filters == {}
    assert retriever._top_k == 10
    assert retriever._num_candidates == 100


def test_to_dict():
    """Check that ``to_dict`` serialises the retriever and its document store.

    Skipped (rather than silently passing without assertions) when the
    optional ``sqlite_vss`` package is not importable.
    """
    pytest.importorskip("sqlite_vss")

    document_store = SQLiteDocumentStore(":memory:")
    retriever = SQLiteVSSEmbeddingRetriever(document_store=document_store, num_candidates=50, embedding_dims=2)
    res = retriever.to_dict()

    assert res == {
        "type": "sqlite_haystack.embedding_retriever.SQLiteVSSEmbeddingRetriever",
        "init_parameters": {
            "document_store": {
                "init_parameters": {
                    "database": ":memory:",
                },
                "type": "sqlite_haystack.document_store.SQLiteDocumentStore",
            },
            "filters": {},
            "top_k": 10,
            "num_candidates": 50,
            "embedding_dims": 2,
        },
    }


def test_from_dict():
try:
import sqlite_vss
expect_not_implemented = False
except ImportError:
expect_not_implemented = True

data = {
"type": "sqlite_haystack.embedding_retriever.SQLiteVSSEmbeddingRetriever",
"init_parameters": {
Expand All @@ -52,20 +80,33 @@ def test_from_dict():
"embedding_dims": 2,
},
}
retriever = SQLiteVSSEmbeddingRetriever.from_dict(data)
assert retriever._document_store
assert retriever._filters == {}
assert retriever._top_k == 10
assert retriever._num_candidates == 50
assert retriever._embedding_dims == 2

if expect_not_implemented:
with pytest.raises(NotImplemented):
retriever = SQLiteVSSEmbeddingRetriever.from_dict(data)
else:
retriever = SQLiteVSSEmbeddingRetriever.from_dict(data)
assert retriever._document_store
assert retriever._filters == {}
assert retriever._top_k == 10
assert retriever._num_candidates == 50
assert retriever._embedding_dims == 2


def test_run():
    """Check that ``run`` returns the single stored document for a matching embedding.

    Skipped (rather than silently passing without assertions) when the
    optional ``sqlite_vss`` package is not importable.
    """
    pytest.importorskip("sqlite_vss")

    store = SQLiteDocumentStore(":memory:")
    retriever = SQLiteVSSEmbeddingRetriever(document_store=store, embedding_dims=2)
    store.write_documents([Document(content="Test doc", embedding=[0.5, 0.7])])
    res = retriever.run(query_embedding=[0.5, 0.7])

    # The result has exactly one entry, "documents", holding the one stored doc.
    assert len(res) == 1
    assert len(res["documents"]) == 1
    assert res["documents"][0].content == "Test doc"

0 comments on commit 3248e36

Please sign in to comment.