aboutsummaryrefslogtreecommitdiff
diff options
context:
space:
mode:
authordarroyolpz <darroyolpz@users.noreply.github.com>2019-09-10 19:26:06 +0200
committerGitHub <noreply@github.com>2019-09-10 19:26:06 +0200
commitf05f45fe0c5ba86bb7fa1d27be912b5f4c6cb844 (patch)
tree8e16695f24fe8cbfec711595d8595233a5df0e38
parent63a695834e7e5837d08d46590d07364bff532a09 (diff)
Shorter and more reusable code. Added comments to the functions.
-rw-r--r--binance-scraping-bot.py18
1 files changed, 13 insertions, 5 deletions
diff --git a/binance-scraping-bot.py b/binance-scraping-bot.py
index f96b6d0..45d2150 100644
--- a/binance-scraping-bot.py
+++ b/binance-scraping-bot.py
@@ -25,18 +25,24 @@ api = tweepy.API(auth)
# Binance extract function
def extract_binance(main_webpage, key_words):
- final_item, final_list = [], []
+ # Create an empty string to store matchings
+ final_list = []
+
+ # Scrap the entire web-page
sauce = urllib.request.urlopen(main_webpage).read()
soup = bs.BeautifulSoup(sauce, 'lxml')
+
+ # Extract the announcements
list = soup.find_all('li', class_ = 'article-list-item')
+
+ # Check for matchings
for article in list:
article_text = article.get_text().replace('\n', '')
for item in key_words:
+ # If matching, create a new list
if item in article_text:
- final_item.append(article_text)
- final_item.append('https://www.binance.com' + article.find('a').get('href'))
- final_list.append(final_item)
- final_item = [] # Reset once is in the final_list to not get duplicates
+ article_link = 'https://www.binance.com' + article.find('a').get('href')
+ final_list.append([article_text, article_link])
return final_list
# Telegram function
@@ -56,8 +62,10 @@ def tg_call(update, context):
# Loop pass - Watchdog mode
while True:
+ # Get new list of urls
new_urls = extract_binance(main_webpage, key_words)
for item in new_urls:
+ # Compare if they were included in the former list
if item not in old_urls:
msg = item[0] + '\n' + item[1]
api.update_status(msg) # Twitter