test now passing
This commit is contained in:
parent
4fd69602f7
commit
462e34013e
@ -1,13 +1,14 @@
|
||||
import logging
|
||||
import asyncio
|
||||
from typing import Union, List, Dict
|
||||
from datetime import datetime
|
||||
|
||||
from aiohttp.client import ClientSession
|
||||
from bs4 import BeautifulSoup
|
||||
from bs4.element import Tag
|
||||
from webutils import in_async_session, gather_in_batches
|
||||
|
||||
from .constants import (HTML_PARSER, BASE_URL, END_DATE, BS, IS, CF, FIN_STMT_URL_SUFFIX, FIN_STMT_ITEMS,
|
||||
from .constants import (DEV_MODE, HTML_PARSER, BASE_URL, END_DATE, BS, IS, CF, FIN_STMT_URL_SUFFIX, FIN_STMT_ITEMS,
|
||||
DEFAULT_CONCURRENT_BATCH_SIZE)
|
||||
from .exceptions import UnknownFinancialStatementItem
|
||||
|
||||
def find_relevant_table_rows(soup: BeautifulSoup) -> List[Tag]:
    """
    Returns the table rows containing the data of interest.

    Every `<tr>` inside the `<tbody>` of the first `<div class="financials">` element is passed to
    `is_relevant_table_row`; rows for which it returns a truthy value are collected.
    Rows that raise `UnknownFinancialStatementItem` are skipped.

    If `DEV_MODE` is truthy and at least one row raised `UnknownFinancialStatementItem`, the whole document
    is written once to `mwfin_unknown_items_<UTC timestamp>.html` (relative path) for later inspection.

    Args:
        soup: The parsed document that is searched for the financials table.

    Returns:
        The relevant table rows, in the order they were found.
    """
    trs = []
    # The dump contains the entire document, so writing it once per call is enough;
    # repeating it for every unknown row would only overwrite the same file with the same content.
    dumped = False
    for tr in soup.find('div', attrs={'class': 'financials'}).tbody.find_all('tr'):
        try:
            if is_relevant_table_row(tr):
                trs.append(tr)
        except UnknownFinancialStatementItem:
            if DEV_MODE and not dumped:
                # The timestamp is only needed when a dump is actually written.
                timestamp = datetime.utcnow().strftime("%Y-%m-%d_%H-%M-%S")
                # Explicit UTF-8 so that non-ASCII characters in the page cannot fail on the locale codec.
                with open(f'mwfin_unknown_items_{timestamp}.html', 'w', encoding='utf-8') as f:
                    f.write(str(soup))
                dumped = True
    return trs
|
||||
|
||||
|
||||
|
Loading…
Reference in New Issue
Block a user