97 lines
3.2 KiB
Python
97 lines
3.2 KiB
Python
import logging
|
|
import asyncio
|
|
import csv
|
|
import json
|
|
from argparse import ArgumentParser
|
|
from pathlib import Path
|
|
from typing import Dict
|
|
|
|
from .functions import get_company_financials, ResultDict
|
|
from .constants import END_DATE, MAIN_LOGGER_NAME
|
|
|
|
|
|
log = logging.getLogger(MAIN_LOGGER_NAME)
|
|
|
|
JSON_EXT, CSV_EXT = '.json', '.csv'
|
|
|
|
TICKER_SYMBOL = 'ticker_symbol'
|
|
QUARTERLY = 'quarterly'
|
|
TO_FILE = 'to_file'
|
|
JSON_INDENT = 'json_indent'
|
|
VERBOSE = 'verbose'
|
|
|
|
|
|
def parse_cli() -> dict:
|
|
parser = ArgumentParser(description="Scrape company financials")
|
|
parser.add_argument(
|
|
TICKER_SYMBOL,
|
|
type=str,
|
|
help="Stock ticker symbol of the company to be scraped the financials of"
|
|
)
|
|
parser.add_argument(
|
|
'-Q', f'--{QUARTERLY}',
|
|
action='store_true',
|
|
help="If set, the financial data for the last quarters is returned; otherwise yearly data is returned."
|
|
)
|
|
parser.add_argument(
|
|
'-f', f'--{TO_FILE.replace("_", "-")}',
|
|
type=Path,
|
|
help="Writes results to the specified destination file. If omitted results are printed to stdout. "
|
|
"Depending on the file name suffix, the output format can be either as CSV or in JSON."
|
|
)
|
|
parser.add_argument(
|
|
f'--{JSON_INDENT.replace("_", "-")}',
|
|
type=int,
|
|
help="If set to a positive integer and the output format is JSON (default), the resulting JSON document is "
|
|
"indented accordingly for more readability; if omitted, output is returned in one line."
|
|
)
|
|
parser.add_argument(
|
|
'-v', f'--{VERBOSE}',
|
|
action='count',
|
|
default=0,
|
|
help="Verbose mode. Reduces the log level and thus prints out more status messages while running. "
|
|
"Using this flag multiple times increases verbosity further."
|
|
)
|
|
return vars(parser.parse_args())
|
|
|
|
|
|
def configure_logging(verbosity: int) -> None:
|
|
root_logger = logging.getLogger()
|
|
root_logger.addHandler(logging.StreamHandler())
|
|
if verbosity > 2:
|
|
root_logger.setLevel(logging.DEBUG)
|
|
elif verbosity == 2:
|
|
root_logger.setLevel(logging.INFO)
|
|
elif verbosity == 1:
|
|
root_logger.setLevel(logging.WARNING)
|
|
|
|
|
|
def write_to_csv(data: Dict[str, ResultDict], file_obj) -> None:
|
|
writer = csv.writer(file_obj)
|
|
for statement_key, statement_dict in data.items():
|
|
end_dates = statement_dict.pop(END_DATE)
|
|
writer.writerow([statement_key] + list(end_dates))
|
|
for key, values in statement_dict.items():
|
|
writer.writerow([key] + list(str(val) for val in values))
|
|
|
|
|
|
async def main() -> None:
|
|
args = parse_cli()
|
|
configure_logging(args[VERBOSE])
|
|
data = await get_company_financials(args[TICKER_SYMBOL], quarterly=args[QUARTERLY])
|
|
path: Path = args[TO_FILE]
|
|
if path is None:
|
|
print(json.dumps(data, indent=args[JSON_INDENT]))
|
|
return
|
|
with open(path, 'w') as f:
|
|
if path.suffix.lower() == CSV_EXT:
|
|
write_to_csv(data, f)
|
|
return
|
|
if not path.suffix.lower() == JSON_EXT:
|
|
log.warning(f"Extension '{path.suffix}' unknown; using JSON format")
|
|
json.dump(data, f, indent=args[JSON_INDENT])
|
|
|
|
|
|
if __name__ == '__main__':
|
|
asyncio.run(main())
|