-
Notifications
You must be signed in to change notification settings - Fork 1
/
db_stocks+news+etfs.py
191 lines (159 loc) · 7.58 KB
/
db_stocks+news+etfs.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
import os
import requests
import sqlalchemy as db
import yfinance as yf
import pandas as pd
from sqlalchemy import text
import time
from ib_insync import *
def create_db():
# create database:
engine = db.create_engine('sqlite:///atradebot.db', echo=True)
connection = engine.connect()
metadata = db.MetaData()
# create a single table:
stocks = db.Table('stocks', metadata,
db.Column('id', db.Integer(), primary_key=True),
db.Column('symbol', db.String(255), nullable=True),
db.Column('name', db.String(255), nullable=True),
db.Column('sector', db.String(255), nullable=True),
db.Column('industry', db.String(255), nullable=True),
db.Column('live_price', db.Float(), nullable=True),
db.Column('prev_close', db.Float(), nullable=True),
db.Column('open', db.Float(), nullable=True),
db.Column("volume", db.Integer(), nullable=True),
)
news = db.Table('news', metadata,
db.Column('id', db.Integer(), primary_key=True),
db.Column('symbol', db.String(255), nullable=True),
db.Column('title', db.String(255), nullable=True),
db.Column('news_date', db.String(255), nullable=True),
db.Column('url', db.String(255), nullable=True),
db.Column('source', db.String(255), nullable=True),
db.Column('text', db.String(255), nullable=True),
)
etfs = db.Table("etfs", metadata,
db.Column("id", db.Integer(), primary_key=True),
db.Column("symbol", db.String(255), nullable=True),
db.Column('name', db.String(255), nullable=True),
db.Column('sector', db.String(255), nullable=True),
db.Column('industry', db.String(255), nullable=True),
db.Column('live_price', db.Float(), nullable=True),
db.Column('prev_close', db.Float(), nullable=True),
db.Column('open', db.Float(), nullable=True),
db.Column("volume", db.Integer(), nullable=True),
)
# create table in database:
metadata.create_all(engine)
return engine, connection, stocks, news
if __name__ == "__main__":
engine, connection, stocks, news = create_db()
connection.execute(text("PRAGMA journal_mode=WAL"))
# get list of stocks:
stock_df = pd.read_excel('SP_500_Companies.xlsx')
symbols = stock_df['Symbol'].tolist()
ib = IB()
ib.connect('127.0.0.1', 7496, clientId=1)
news_providers = ib.reqNewsProviders()
codes = '+'.join(news_provider.code for news_provider in news_providers)
# get list of etfs (top 10)
etfs_symbols = ["SPY", "IVV", "VOO", "VTI", "QQQ", "VEA", "VTV", "IEFA", "BND", "VUG"]
# get data for symbols:
for i in symbols[:5]:
trans = connection.begin_nested()
try:
# get stock info
try:
ticker = yf.Ticker(i)
info = ticker.info
stock_values = {
"symbol": i,
'name': info.get('shortName', 'NA'),
'sector': info.get('sector', 'NA'),
'industry': info.get('industry', 'NA'),
'live_price': info.get('regularMarketPrice', 0.0),
'prev_close': info.get('previousClose', 0.0),
'open': info.get('open', 0.0),
'volume': info.get('volume', 0)
}
# Insert the stock into the database
query_stock = db.insert(stocks)
ResultProxy = connection.execute(query_stock, [stock_values])
# Error handling for stock info fetching
except requests.exceptions.HTTPError as error_terminal:
print("HTTPError while fetching stock info for symbol:", i)
except Exception as e: # General exception catch
print("Unexpected error while fetching stock info for symbol:", i)
# Fetch and store news articles
try:
stock = Stock(i, 'SMART', 'USD')
ib.qualifyContracts(stock)
headlines = ib.reqHistoricalNews(stock.conId, codes, '', '', 100)
for headline in headlines:
article_date = headline.time.date()
article = ib.reqNewsArticle(headline.providerCode, headline.articleId)
# Insert the article into the database
news_info = {
'symbol': i,
'title': '', # Title not needed
'news_date': str(article_date),
'url': '', # URL not provided
'source': '', # Source not provided
'text': article.articleText
}
# Insert the news into the database
query_news = db.insert(news)
ResultProxy = connection.execute(query_news, [news_info])
# Error handling for news fetching
except requests.exceptions.HTTPError as error_terminal:
print("HTTPError while fetching news for symbol:", i)
except Exception as e: # General exception catch
print("Unexpected error while fetching news for symbol:", i)
trans.commit()
time.sleep(1)
# Error handling
except Exception as e: # General exception catch
print("Unexpected error:", e)
trans.rollback()
# get data for etf symbols
for i in etfs_symbols:
trans = connection.begin_nested()
try:
try:
#get etf info
ticker = yf.Ticker(i)
info = ticker.info()
etf_values = {
"symbol": i,
'name': info.get('shortName', 'NA'),
'sector': info.get('sector', 'NA'),
'industry': info.get('industry', 'NA'),
'live_price': info.get('regularMarketPrice', 0.0),
'prev_close': info.get('previousClose', 0.0),
'open': info.get('open', 0.0),
'volume': info.get('volume', 0)
}
# Insert etfs into the database:
query_etf = db.insert(etfs)
ResultProxy = connection.execute(query_etf, [etf_values])
# Error handling for ETF info fetching:
except requests.exceptions.HTTPError as error_terminal:
print("HTTPError while fetching stock info for symbol:", i)
except Exception as e: # General exception catch
print("Unexpected error while fetching stock info for symbol:", i)
trans.commit()
time.sleep(1)
# Error handling:
except Exception as e: # General exception catch
print("Unexpected error:", e)
trans.rollback()
# Fetch and print the first 5 stocks from the database after processing
#query = db.select([data]).limit(5)
query = stocks.select().limit(5)
ResultProxy = connection.execute(query)
ResultSet = ResultProxy.fetchall()
for result in ResultSet:
print(result)
connection.execute(text("PRAGMA journal_mode=WAL"))
# Close the connection
connection.close()