hellocomputer/test/test_query.py
Guillem Borrell 495c22e0de
Some checks failed
ci/woodpecker/push/woodpecker Pipeline failed
Removed sensitive api key
2024-07-13 11:53:37 +02:00

68 lines
2.1 KiB
Python

from pathlib import Path
import hellocomputer
import pytest
import polars as pl
from hellocomputer.config import settings
from hellocomputer.db import StorageEngines
from hellocomputer.extraction import extract_code_block
from hellocomputer.models import Chat
from hellocomputer.db.sessions import SessionDB
TEST_STORAGE = StorageEngines.local
TEST_OUTPUT_FOLDER = Path(hellocomputer.__file__).parents[2] / "test" / "output"
TEST_XLS_PATH = (
Path(hellocomputer.__file__).parents[2]
/ "test"
/ "data"
/ "TestExcelHelloComputer.xlsx"
)
SID = "test"
@pytest.mark.asyncio
@pytest.mark.skipif(settings.llm_api_key == "Awesome API", reason="API Key not set")
async def test_chat_simple():
chat = Chat(api_key=settings.llm_api_key, temperature=0)
chat = await chat.eval("Say literlly 'Hello'")
assert "Hello" in chat.last_response_content()
@pytest.mark.asyncio
@pytest.mark.skipif(settings.llm_api_key == "Awesome API", reason="API Key not set")
async def test_simple_data_query():
query = "write a query that finds the average score of all students in the current database"
chat = Chat(
api_key=settings.llm_api_key,
temperature=0.5,
)
db = SessionDB(
storage_engine=StorageEngines.local, path=TEST_XLS_PATH.parent, sid=SID
).load_xls(TEST_XLS_PATH)
chat = await chat.sql_eval(db.query_prompt(query))
query = extract_code_block(chat.last_response_content())
assert query.startswith("SELECT")
@pytest.mark.asyncio
@pytest.mark.skipif(settings.llm_api_key == "Awesome API", reason="API Key not set")
async def test_data_query():
q = "Find the average score of all the sudents"
llm = Chat(
api_key=settings.llm_api_key,
temperature=0.5,
)
db = SessionDB(
storage_engine=TEST_STORAGE, path=TEST_OUTPUT_FOLDER, sid="test"
).load_folder()
chat = await llm.sql_eval(db.query_prompt(q))
query = extract_code_block(chat.last_response_content())
result: pl.DataFrame = db.query(query).pl()
assert result.shape[0] == 1
assert result.select([pl.col("avg(Score)")]).to_series()[0] == 0.5