forked from leonkuperman/llm_demo_news
-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathdb_setup.py
64 lines (55 loc) · 2.16 KB
/
db_setup.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
# db_setup.py
import sqlite3
from contextlib import contextmanager
from logger_config import get_logger
logger = get_logger(__name__)
@contextmanager
def get_db_connection():
conn = sqlite3.connect('articles.db')
conn.row_factory = sqlite3.Row
yield conn
conn.close()
def get_last_id():
with get_db_connection() as conn:
cursor = conn.execute("SELECT MAX(finnhub_id) FROM articles")
result = cursor.fetchone()[0]
last_id = result if result is not None else 0 # Return 0 if no rows found
logger.info('Retrieved last_id from database: %s', last_id)
return last_id
def init_db():
logger.info("Initializing DB...")
with get_db_connection() as conn:
conn.execute('''CREATE TABLE IF NOT EXISTS articles (
id INTEGER PRIMARY KEY,
finnhub_id INTEGER UNIQUE,
category TEXT,
datetime INTEGER,
headline TEXT,
image TEXT,
related TEXT,
source TEXT,
summary TEXT,
url TEXT,
is_classified INTEGER DEFAULT 0,
classification TEXT,
market_sentiment REAL DEFAULT 0, -- Calculated sentiment score from -5 to 5
industry_category TEXT, -- Calculated industry category (GICS)
classification_model TEXT, -- Model used for classification
provider TEXT -- Provider used for classification
)''')
logger.info("DB initialization completed.")
def reset_classifications():
with get_db_connection() as conn:
conn.execute('''UPDATE articles
SET is_classified = 0,
classification = NULL,
market_sentiment = 0,
industry_category = NULL,
classification_model = NULL''')
conn.commit()
logger.info("Reset classifications for all articles.")
# main function to test setup
if __name__ == '__main__':
init_db()
logger.info('Last Article ID: %s' % get_last_id())
logger.info('Database setup complete.')