-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathmain.py
117 lines (87 loc) · 3.8 KB
/
main.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
import argparse
import datetime
import re
from bs4 import BeautifulSoup
from selenium import webdriver
import yaml
def load_configuration(file='.config'):
"""
Load configuration from YAML file.
Format is like:
Institution:
AccountName:
- AAPL
- MSFT
- AMZN
- GOOGL
- FB
There can be any number of institutions and accounts specified.
"""
# Disclaimer: The stocks listed above are examples only,
# and are not to be taken as a recommendation or endorsement.
with open(file, 'r') as f:
return yaml.safe_load(f)
def format_stock_price(date_str, symbol, currency, price):
# The date string is formatted like '2023-05-10', but we want to output like '2023/05/10'.
#
# For the output line,
# the symbol starts at col 25, (so date width will be 25, less 2 (for 'P '), less 1 (ends at col 39))
# currency at col 40, (so symbol width will be 15)
# price decimal is placed at col 50. (so currency width will be 10 less space in front of decimal)
#
return f"P {date_str.replace('-', '/'):<22}{symbol:<15}{currency:<{10 - price.index('.')}}{price}"
def get_stock_price(webdriver, symbol, date_str):
"""Return currency and price as a tuple."""
url = f'https://ca.finance.yahoo.com/quote/{symbol}/history'
webdriver.get(url)
soup = BeautifulSoup(webdriver.page_source, 'lxml')
# Find the price by keying on the date (determine the row),
# so we need to format it to match, eg. 'Nov 4, 2024'.
date_obj = datetime.datetime.strptime(date_str, '%Y-%m-%d')
[month, day_padded, year] = list(map(date_obj.strftime, ['%b', '%d', '%Y']))
date_text = f'{month} {int(day_padded)}, {year}'
date_td = soup.find('td', string=date_text)
if date_td is None:
raise ValueError(f'No data available for {symbol} on {date_str}.')
# After determining the row we'll then traverse the HTML
# to find the price at market close.
# For some reason we have to traverse 2 siblings per table cell.
price_at_close_cell = date_td
for _ in range(8):
price_at_close_cell = price_at_close_cell.nextSibling
price = price_at_close_cell.contents[0].string
# Grab the currency by looking for the specific phrase in which it appears.
currency_span = soup.find('span', string=re.compile(r'^Currency in \w{3}'))
currency = currency_span.contents[0].string[-3:]
return currency, f'{float(price):.2f}'
if __name__ == '__main__':
parser = argparse.ArgumentParser(description=(
'Get historical price information for given stock symbols '
'and return the data in a format suitable for Ledger CLI.'
))
parser.add_argument('date', metavar='YYYY-MM-DD', type=str, help='A date in the format YYYY-MM-DD.')
parser.add_argument('--verbose', '-v', action='store_true', help='Enable verbose output.')
parser.add_argument(
'--output-file', '-o',
dest='output', metavar='output.txt',
type=str, default='output.txt',
help='Output file name, defaults to `output.txt`.'
)
args = parser.parse_args()
data = load_configuration()
output = []
driver = webdriver.Firefox()
for institution in data.keys():
if args.verbose:
print(f'Processing `{institution}` institution..')
output.append(f'; {institution}')
for account in data[institution].keys():
output.append(f'; {account}')
for symbol in data[institution][account]:
currency, price = get_stock_price(driver, symbol, args.date)
output.append(format_stock_price(args.date, symbol, currency, price))
driver.quit()
with open(args.output, 'w') as f:
f.write('\n'.join(output))
if args.verbose:
print(f'Output successfully written to {args.output}.')