-
Notifications
You must be signed in to change notification settings - Fork 665
/
conftest.py
133 lines (98 loc) · 3.88 KB
/
conftest.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
from __future__ import annotations
import logging
import os
import shutil
from collections.abc import Iterator
from pathlib import Path
from typing import Any
from unittest.mock import patch
import pytest
from dotenv import load_dotenv
from paperqa.clients.crossref import CROSSREF_HEADER_KEY
from paperqa.clients.semantic_scholar import SEMANTIC_SCHOLAR_HEADER_KEY
from paperqa.settings import Settings
from paperqa.types import PQASession
from paperqa.utils import setup_default_logs
TESTS_DIR = Path(__file__).parent
CASSETTES_DIR = TESTS_DIR / "cassettes"
@pytest.fixture(autouse=True, scope="session")
def _load_env() -> None:
load_dotenv()
@pytest.fixture(autouse=True)
def _setup_default_logs() -> None:
setup_default_logs()
OPENAI_API_KEY_HEADER = "authorization"
ANTHROPIC_API_KEY_HEADER = "x-api-key"
# SEE: https://github.com/kevin1024/vcrpy/blob/v6.0.1/vcr/config.py#L43
VCR_DEFAULT_MATCH_ON = "method", "scheme", "host", "port", "path", "query"
@pytest.fixture(scope="session", name="vcr_config")
def fixture_vcr_config() -> dict[str, Any]:
return {
"filter_headers": [
CROSSREF_HEADER_KEY,
SEMANTIC_SCHOLAR_HEADER_KEY,
OPENAI_API_KEY_HEADER,
ANTHROPIC_API_KEY_HEADER,
"cookie",
],
"record_mode": "once",
"allow_playback_repeats": True,
"cassette_library_dir": str(CASSETTES_DIR),
}
@pytest.fixture
def tmp_path_cleanup(tmp_path: Path) -> Iterator[Path]:
yield tmp_path
# Cleanup after the test
if tmp_path.exists():
shutil.rmtree(tmp_path, ignore_errors=True)
@pytest.fixture
def agent_home_dir(tmp_path_cleanup: str | os.PathLike) -> Iterator[str | os.PathLike]:
"""Set up a unique temporary folder for the agent module."""
with patch.dict("os.environ", {"PQA_HOME": str(tmp_path_cleanup)}):
yield tmp_path_cleanup
@pytest.fixture
def agent_index_dir(agent_home_dir: Path) -> Path:
return agent_home_dir / ".pqa" / "indexes"
@pytest.fixture(scope="session", name="stub_data_dir")
def fixture_stub_data_dir() -> Path:
return Path(__file__).parent / "stub_data"
@pytest.fixture
def agent_test_settings(agent_index_dir: Path, stub_data_dir: Path) -> Settings:
# NOTE: originally here we had usage of embedding="sparse", but this was
# shown to be too crappy of an embedding to get past the Obama article
settings = Settings()
settings.agent.index.paper_directory = stub_data_dir
settings.agent.index.index_directory = agent_index_dir
settings.agent.search_count = 2
settings.answer.answer_max_sources = 2
settings.answer.evidence_k = 10
return settings
@pytest.fixture
def agent_stub_session() -> PQASession:
return PQASession(question="What is is a self-explanatory model?")
@pytest.fixture
def stub_data_dir_w_near_dupes(stub_data_dir: Path, tmp_path: Path) -> Iterator[Path]:
# add some near duplicate files then removes them after testing
for filename in ("bates.txt", "obama.txt"):
if not (tmp_path / f"{filename}_modified.txt").exists():
with (stub_data_dir / filename).open() as f:
content = f.read()
with (tmp_path / f"{Path(filename).stem}_modified.txt").open("w") as f:
f.write(content)
f.write("## MODIFIED FOR HASH")
yield tmp_path
if tmp_path.exists():
shutil.rmtree(tmp_path, ignore_errors=True)
@pytest.fixture(name="reset_log_levels")
def fixture_reset_log_levels(caplog) -> Iterator[None]:
logging.getLogger().setLevel(logging.DEBUG)
for name in logging.root.manager.loggerDict:
logger = logging.getLogger(name)
logger.setLevel(logging.DEBUG)
logger.propagate = True
caplog.set_level(logging.DEBUG)
yield
for name in logging.root.manager.loggerDict:
logger = logging.getLogger(name)
logger.setLevel(logging.NOTSET)
logger.propagate = True