""" script for news fetching (by keywords) """ __author__ = "Florian Kellermann, Linus Eickhoff" __date__ = "15.03.2022" __version__ = "0.0.1" __license__ = "None" import sys import os import json import pandas as pd from newsapi import NewsApiClient from dotenv import load_dotenv load_dotenv() # Init newsapi = NewsApiClient(api_key=os.getenv('NEWS_API_KEY')) # /v2/top-headlines top_headlines = newsapi.get_top_headlines(q='bitcoin', sources='bbc-news,the-verge', language='en') # /v2/everything all_articles = newsapi.get_everything(q='bitcoin', sources='bbc-news,the-verge', domains='bbc.co.uk,techcrunch.com', from_param='2022-03-14', to='2022-03-15', language='en', sort_by='relevancy', page=2) # /v2/top-headlines/sources sources = newsapi.get_sources() def get_top_news_by_keyword(keyword): top_headlines = newsapi.get_top_headlines(q=keyword, sources='bbc-news,the-verge,cnn', language='en') out_file = open("top_headline.json", "w") json.dump(top_headlines, out_file) return top_headlines def format_article(article): sourcename = article["source"]["name"] headline = article["title"] url = article["url"] formatted_article = f"{sourcename}\n{headline}\n\ntext" return formatted_article if __name__ == '__main__': print("fetching top news by keyword business...") articles = get_top_news_by_keyword("business") formatted_article = format_article(articles["articles"][0]) print(formatted_article)