In [1]:
import datetime as dt
import gdelt as gd
from newspaper import Article
import nltk
import spacy
from spacy import displacy

In [2]:
# Download the trained pipeline package
#!python -m spacy download en_core_web_sm

In [3]:
# Instantiate the client from the `gdelt` package; the query cell that follows
# calls its Search() method.
gdelt_client = gd.gdelt()

In [4]:
# Fetch the GDELT "events" table for the day exactly one week before now.
date = dt.datetime.now() - dt.timedelta(weeks=1)
# The client is given the day as a space-separated 'YYYY MM DD' string.
date_string = f'{date:%Y %m %d}'
# NOTE(review): coverage=True presumably requests the whole day's data rather
# than a single update file -- confirm against the gdelt package docs.
gdelt_events = gdelt_client.Search(
    date_string,
    table='events',
    coverage=True,
)

In [5]:
#highest_count = gdelt_events['SOURCEURL'].value_counts()[0]
#gdelt_events.groupby('SOURCEURL').filter(lambda value_count: len(value_count) == highest_count)

def get_mode_url(events):
    """Return the most frequent value of the ``SOURCEURL`` column.

    Args:
        events: Table-like object (e.g. a pandas DataFrame) with a
            ``SOURCEURL`` column.

    Returns:
        The first entry of the column's ``mode()`` result. When several
        URLs tie for most frequent, only that first entry is returned.
    """
    url_modes = events['SOURCEURL'].mode()
    return url_modes[0]

def get_most_common_urls(events, count):
    """Return the ``count`` most frequent ``SOURCEURL`` values as a list.

    Args:
        events: Table-like object (e.g. a pandas DataFrame) with a
            ``SOURCEURL`` column.
        count: Number of leading entries to keep from the frequency table.

    Returns:
        A list of URLs taken from the index of ``value_counts()``, in the
        order that frequency table lists them.
    """
    url_frequencies = events['SOURCEURL'].value_counts()
    # Positional slice: keep the first `count` rows of the frequency table.
    leading = url_frequencies.iloc[:count]
    return leading.index.to_list()

def create_nlp(model_name='en_core_web_sm'):
    """Load and return a spaCy pipeline.

    Args:
        model_name: Name of the installed spaCy pipeline package to load.
            Defaults to ``'en_core_web_sm'``, so existing calls without
            arguments behave as before.

    Returns:
        Whatever ``spacy.load(model_name)`` returns (the loaded pipeline).
    """
    return spacy.load(model_name)

def prepare_parsing():
    """Make sure the NLTK ``punkt`` tokenizer data is installed.

    The download is only triggered when the resource cannot be found
    locally. Repeated calls therefore skip the network round trip and the
    ``[nltk_data]`` log lines, and keep working offline once the data is
    present.

    NOTE(review): presumably required by ``Article.nlp()``, which the
    callers run right after this function -- confirm against newspaper.
    """
    try:
        nltk.data.find('tokenizers/punkt')
    except LookupError:
        # Resource not installed yet: fetch it once.
        nltk.download('punkt')

def get_parsed_article(url):
    """Build an ``Article`` for ``url`` and run it through every stage.

    Args:
        url: Address of the article to fetch.

    Returns:
        The ``Article`` instance after ``download()``, ``parse()`` and
        ``nlp()`` have been called on it, in that order.
    """
    fetched = Article(url)
    # Stage order matters: download -> parse -> nlp.
    for stage in (fetched.download, fetched.parse, fetched.nlp):
        stage()
    return fetched

def print_article(article):
    """Print an article's title, publish date, keywords and summary.

    Each of the four attributes is written to stdout in that order, with a
    newline after each one.

    Args:
        article: Object exposing ``title``, ``publish_date``, ``keywords``
            and ``summary`` attributes.
    """
    print(
        article.title,
        article.publish_date,
        article.keywords,
        article.summary,
        sep='\n',
    )

def print_articles(urls):
    """Fetch every URL and print its article details, one after another.

    ``prepare_parsing()`` is called once up front. Each URL is then turned
    into a parsed article, printed with ``print_article`` and followed by
    an empty line.

    Args:
        urls: Iterable of article URLs.
    """
    prepare_parsing()
    # map() is lazy, so each article is fetched right before it is printed.
    for parsed in map(get_parsed_article, urls):
        print_article(parsed)
        print()
        
def pprint_articles(urls, nlp=None):
    """Print each article's details and render its named entities.

    For every URL the article is fetched and printed with
    ``print_article``. Its text is then run through the spaCy pipeline and
    rendered with displaCy's ``'ent'`` style, followed by an empty line.

    Args:
        urls: Iterable of article URLs.
        nlp: Optional callable that turns text into a spaCy document.
            When omitted, a pipeline is loaded once via ``create_nlp()``.
            Passing an already loaded pipeline avoids reloading the model
            on every call.
    """
    prepare_parsing()
    if nlp is None:
        nlp = create_nlp()
    for url in urls:
        article = get_parsed_article(url)
        print_article(article)
        # Some articles come back without any body text; there is nothing
        # to analyse or render for those, so skip the NER step.
        if article.text and article.text.strip():
            article_doc = nlp(article.text)
            displacy.render(article_doc, style='ent')
        print('')


In [6]:
# Pick the five URLs that occur most often in gdelt_events['SOURCEURL'],
# then print each article and render its named entities.
urls = get_most_common_urls(gdelt_events, 5)
pprint_articles(urls)

[nltk_data] Downloading package punkt to
[nltk_data]     /home/gisfromscratch/nltk_data...
[nltk_data]   Package punkt is already up-to-date!


History of Ahmadiyya in Singapore
2021-07-04 00:00:00
['history', 'muhammad', 'sahib', 'singapore', 'missionary', 'came', 'jemaat', 'maulvi', 'maulana', 'ahmadiyyat', 'ahmadiyya', 'left']
Furthermore, Mathew Finlay wrote to the President of the Jemaat Ahmadiyya in Singapore, Abdul Hamid Salikin, not to publish that debate.
Whereupon during the time of Maulvi Muhammad Siddiq Sahib that they build the first mosque which was called the Masjid Ahmadiyya Singapura.
b) Hazrat Sir Zafrullah Khan Sahib r.a.c) Hazrat Maulvi Muhammad Hussain Sahib who came to Singapore in 1984.
In that debate Maulvi Khairuddin Barus Sahib of Indonesia and Maulvi Zoudi Sahib of Malaysia represented the Jemaat Ahmadiyya of Singapore.
source Ahmadiyya Muslim Mission Singapore » History of Ahmadiyya in Singapore



Coronavirus in Russia: The Latest News
2021-07-03 00:00:00
['russias', 'vaccine', 'announced', 'vaccination', 'moscow', 'latest', 'covid19', 'authorities', 'coronavirus', 'russia', 'city']
Russia has confirmed 5,783,333 cases of coronavirus and 143,002 deaths , according to the national coronavirus information center.
— A senior administrator at a western Russian clinic has been detained on suspicion of selling fake coronavirus vaccine certificates, police said Wednesday.
— Russia could allow pregnant women to start receiving the coronavirus vaccine within the next one to two weeks, Health Minister Mikhail Murashko said.
— Moscow authorities announced a “non-working week” from June 15-19 in an attempt to curb the growing number of infections.
— Serbia is starting to produce Russia's Sputnik V coronavirus vaccine, President Aleksandar Vucic said on Friday, the first European nation outside Russia and Belarus to take the step.



Palestinian Killed, Scores Injured and Abducted, More Air Strikes on Gaza by Israeli Occupation Forces, July 4, 2021
2021-07-04 00:00:00
['palestinians', 'scores', 'palestinian', 'strikes', 'west', 'injured', 'bank', 'forces', 'israeli', 'soldiers', 'killed', 'air', 'protests', 'including', 'gaza', 'occupation']
Israeli Occupation Army Fires Missiles Into GazaIMEMC, July 4, 2021The Israeli occupation army fired, on Saturday at night, several missiles into a site, south of Gaza city, and another area northeast of the city.
In the West Bank, including East Jerusalem, 28 Palestinians, including five children, were killed as of 24 May.
Israeli Occupation Army Injures Dozens in West Bank Protests Against SettlementsIMEMC, July 4, 2021Scores of Palestinian demonstrators were injured, on Friday, when Israeli occupation forces attacked peaceful protests across the occupied West Bank, the Palestinian WAFA News Agency reported.
Israeli Occupation Soldiers Army Abducts Three Palestinians In Jeru


Egyptian man, 24, who stabbed father-of-12 rabbi outside a Boston synagogue overstayed student visa
2021-07-04 06:08:38+01:00
['community', 'outside', 'visa', 'awad', 'jewish', 'overstayed', 'noginski', 'rabbi', 'man', 'attack', 'boston', 'synagogue', 'hate', 'egyptian', 'shaloh', 'stabbed', 'fatherof12', 'student']
Rollins attended a community vigil on Friday morning with Mayor Kim Janey where the attack against Rabbi Noginski allegedly took place.
Hours later, another image was shared from the hospital which showed Rabbi Noginski lying on a bed while looking at the camera.
Boston's Jewish community is angry, living in fear and need answers, accountability and security.'
Rabbi Rodkin said in a statement on Thursday: 'Earlier today, Rabbi Shlomo Noginski was attacked on the street outside the Shaloh House.
'We are all very shaken by what happened and ask for you to please keep Rabbi Noginski in your prayers for a... speedy and complete recovery.




None
[]








In [6]:
# Show the list of URLs selected in the previous cell.
urls
# NOTE(review): `article` is not defined at notebook level in the cells
# visible here, so the call below stays disabled.
#print_article(article)

['https://www.msn.com/en-xl/middleeast/top-stories/iran-astana-process-puts-forward-solution-to-syria-issue/ar-AALZeu2',
 'https://www.deccanherald.com/opinion/indias-co-win-redemption-1006995.html',
 'https://www.msn.com/en-xl/news/other/from-pakistan-to-zambia-how-does-china-pick-its-ironclad-friends/ar-AAM02e6',
 'https://www.japantimes.co.jp/news/2021/07/10/world/afghanistan-pilots-us-military/',
 'https://pajhwok.com/2021/07/10/civilian-casualties-resurge-amid-peace-push/']