fix markup parsing

This commit is contained in:
Evgeny Zinoviev 2021-09-18 16:33:05 +03:00
parent ed1bd77440
commit a153106894

View File

@@ -1,9 +1,10 @@
#!/usr/bin/env python3 #!/usr/bin/env python3
import sys, traceback import traceback
from requests import get from requests import get
from bs4 import BeautifulSoup from bs4 import BeautifulSoup
from ch1p import State, telegram_notify from ch1p import State, telegram_notify
from html import escape from html import escape
from argparse import ArgumentParser
def scrap_announcements(): def scrap_announcements():
@@ -23,10 +24,7 @@ def scrap_announcements():
} }
for link in c.find_next('div').select('a[data-bn-type="link"]'): for link in c.find_next('div').select('a[data-bn-type="link"]'):
id = link.get('id') if link.text.strip().lower() == 'view more':
if id is None:
continue
if not link.get('id').startswith('supportList'):
continue continue
href = link.get('href') href = link.get('href')
@@ -47,6 +45,10 @@ def scrap_announcements():
if __name__ == '__main__': if __name__ == '__main__':
parser = ArgumentParser()
parser.add_argument('--stdout', action='store_true')
args = parser.parse_args()
state = State(default=dict(urls=[])) state = State(default=dict(urls=[]))
try: try:
blocks = [] blocks = []
@@ -66,7 +68,14 @@ if __name__ == '__main__':
if blocks: if blocks:
message = '<b>Binance Announcements</b>\n\n' message = '<b>Binance Announcements</b>\n\n'
message += '\n\n'.join(blocks) message += '\n\n'.join(blocks)
telegram_notify(text=message, parse_mode='HTML', disable_web_page_preview=True)
if args.stdout:
print(message)
else:
telegram_notify(text=message, parse_mode='HTML', disable_web_page_preview=True)
except: except:
telegram_notify(text='error: ' + escape(traceback.format_exc()), parse_mode='HTML') if args.stdout:
traceback.print_exc()
else:
telegram_notify(text='error: ' + escape(traceback.format_exc()), parse_mode='HTML')