TelegramAktienBot/telegram_bot/news/news_fetcher.py

83 lines
2.2 KiB
Python
Raw Normal View History

2022-03-15 08:05:28 +00:00
"""
script for news fetching (by keywords)
"""
__author__ = "Florian Kellermann, Linus Eickhoff"
__date__ = "15.03.2022"
__version__ = "0.0.1"
2022-03-15 09:39:29 +00:00
__license__ = "None"
2022-03-29 10:04:49 +00:00
from ast import parse
2022-03-15 09:39:29 +00:00
import sys
2022-03-15 13:01:33 +00:00
import os
import json
2022-03-16 12:32:26 +00:00
import requests
2022-03-29 11:37:44 +00:00
import datetime as dt
2022-03-15 13:01:33 +00:00
from newsapi import NewsApiClient
from dotenv import load_dotenv
load_dotenv()
2022-03-15 10:27:54 +00:00
# Init
2022-03-16 12:32:26 +00:00
api_key = os.getenv('NEWS_API_KEY')
newsapi = NewsApiClient(api_key=api_key)
source_json = requests.get(f"https://newsapi.org/v2/top-headlines/sources?apiKey={api_key}&language=en").json()
sources = source_json["sources"]
str_sources = ",".join([source["id"] for source in sources])
2022-03-15 10:27:54 +00:00
2022-03-29 11:37:44 +00:00
def get_all_news_by_keyword(keyword, from_date="2000-01-01"): # hard coded will change soon
2022-03-29 10:28:28 +00:00
"""get all news to keyword
2022-03-15 13:43:05 +00:00
Args:
keyword (String): keyword for search
2022-03-29 11:37:44 +00:00
from_date (String): min date for search
2022-03-15 13:43:05 +00:00
Returns:
JSON/dict: dict containing articles
2022-03-29 10:04:49 +00:00
"""
2022-03-29 11:37:44 +00:00
top_headlines = newsapi.get_everything(q=keyword, sources=str_sources, language='en', from_param=from_date)
2022-04-04 16:57:59 +00:00
if(top_headlines["status"] == "ok"):
return top_headlines
else:
return None
def get_top_news_by_keyword(keyword):
"""get top news to keyword
Args:
keyword (String): keyword for search
Returns:
JSON/dict: dict containing articles
"""
top_headlines = newsapi.get_top_headlines(q=keyword, sources=str_sources, language='en')
if(top_headlines["status"] == "ok"):
return top_headlines
else:
return None
def format_article(article):
2022-03-15 13:43:05 +00:00
"""format article for messaging (using markdown syntax)
Args:
article (dict): article to format for messaging
Returns:
String: formatted article
"""
sourcename = article["source"]["name"]
headline = article["title"]
url = article["url"]
2022-03-15 13:24:11 +00:00
formatted_article = f"_{sourcename}_\n*{headline}*\n\n{url}"
return formatted_article
2022-03-15 09:39:29 +00:00
if __name__ == '__main__':
2022-03-15 13:24:11 +00:00
2022-03-29 11:37:44 +00:00
print("this is a module and should not be run directly")
print("fetching top news by keyword bitcoin...")
2022-03-15 13:01:33 +00:00
2022-03-29 10:29:13 +00:00
articles = get_all_news_by_keyword("bitcoin")
2022-03-15 13:01:33 +00:00
formatted_article = format_article(articles["articles"][0])
print(formatted_article)