In [7]:
# Import libraries
import os
from pprint import pprint

import keras
import numpy as np
from cleantext import clean
from dotenv import load_dotenv
from newsapi import NewsApiClient
import spacy
from spacy import displacy

In [8]:
# Load environment secrets from `.env` file.
# Proxy settings (e.g. HTTPS_PROXY, including any username/password) belong in
# `.env` too, rather than hardcoded here where they get committed and shared
# together with the notebook.
load_dotenv()

# Initialize the API client with the API key
API_KEY = os.environ["NEWSAPI_KEY"]
api = NewsApiClient(api_key=API_KEY)

# Fetch the latest top-headlines in India
headlines = api.get_top_headlines(country="in")
pprint(headlines)

{'articles': [{'author': 'ANI',
               'content': 'The tech giant is shifting the way it presents '
                          'search results to incorporate conversations with '
                          'artificial intelligence, along with more short '
                          'video and social-media posts, a departure from the '
                          'list … [+764 chars]',
               'description': 'California, May 7: Google is planning to make '
                              'its search engine more "visual, snackable, '
                              'personal, and human," with a focus on serving '
                              'young people globally, Th',
               'publishedAt': '2023-05-08T00:06:14Z',
               'source': {'id': None, 'name': 'Greater Kashmir'},
               'title': 'Google plans to make search more ‘personal’ with AI '
                        'chat, video clips - Greater Kashmir',
               'url': 'https://www.greaterkashmir.com/

In [9]:
# Load spaCy's large English pipeline. When the model package is not installed
# `spacy.load` raises OSError; download it once and retry so the notebook also
# runs on a fresh environment without manually uncommenting a download line.
SPACY_MODEL = "en_core_web_lg"
try:
    NER = spacy.load(SPACY_MODEL)
except OSError:
    spacy.cli.download(SPACY_MODEL)
    NER = spacy.load(SPACY_MODEL)

def spacy_large_ner(document):
    """Return the set of named entities found in ``document``.

    The text is run through the module-level ``NER`` pipeline. Each entity
    becomes a ``(text, label)`` tuple, with surrounding whitespace stripped
    from the entity text; duplicates collapse because the result is a set.
    """
    parsed = NER(document)
    entities = set()
    for entity in parsed.ents:
        entities.add((entity.text.strip(), entity.label_))
    return entities

def display_ner_text(text):
    """Render the named entities of ``text`` inline in the notebook.

    The text is processed with the module-level ``NER`` pipeline and drawn
    with displaCy's entity visualizer. Nothing is returned.

    ``None``, empty, or whitespace-only input is ignored: there is nothing
    to annotate, and the pipeline is not called at all in that case.
    """
    if not text or not text.strip():
        return

    doc = NER(text)
    displacy.render(doc, style="ent", jupyter=True)

In [10]:
# Specify which model to use (relative path, resolved against the kernel's
# working directory)
MODEL_FILEPATH = "../models/models-1683093761.h5"

# Load the saved Keras model
model = keras.models.load_model(MODEL_FILEPATH)

def classify_text(text):
    """Score a single piece of text with the loaded Keras ``model``.

    The text is normalised with ``clean`` and wrapped in a one-element
    array, so the model sees a batch of size one. The value returned is
    element ``[0][0]`` of the prediction output.
    NOTE(review): the meaning of the score (which class it favours) depends
    on how the model was trained - confirm against the training notebook.
    """
    batch = np.array([clean(text)])
    scores = model.predict(batch, verbose=0)
    return scores[0][0]


articles = headlines["articles"]

# Classify each headline's description and visualise its named entities.
for article in articles:
    title = article["title"]
    # The description can be missing or None for some articles; report and
    # skip those instead of passing a non-string on to the classifier and
    # the NER pipeline, which would abort the whole loop.
    description = article.get("description")

    print(f"Title: {title}")
    if not description:
        print("Description: (missing, skipped)")
        print()
        continue

    score = classify_text(description)
    print(f"Description: {description}")
    print(f"Classification: {score}")
    print()

    display_ner_text(description)

Title: Google plans to make search more ‘personal’ with AI chat, video clips - Greater Kashmir
Description: California, May 7: Google is planning to make its search engine more "visual, snackable, personal, and human," with a focus on serving young people globally, Th
Classification: 0.7891131639480591



Title: BJP provided ‘corruption rate-cards’: DK Shivakumar on ECI's notice on ads - Hindustan Times
Description: On Friday, the BJP alleged that Congress was making false allegations of corruption against them and filed a complaint with the ECI. | Latest News India
Classification: 0.23816132545471191



Title: BJP's Vasundhara Raje's Counter After Ashok Gehlot's Bombshell - NDTV
Description: Senior BJP leader Vasundhara Raje has reacted sharply to Chief Minister Ashok Gehlot's claim that she and two other BJP leaders had helped save his government in 2020 during the revolt of Sachin Pilot.
Classification: 0.5477765202522278



Title: 7 Killed As SUV Runs Over People Waiting At Bus Stop In Texas: Police - NDTV
Description: Seven people died and as many as six others were injured Sunday in Texas when a driver crashed into them outside a facility housing migrants in the southern US state, police said.
Classification: 0.42624130845069885



Title: Exes Akshay Kumar and Raveena Tandon share hugs at HT India's Most Stylish - Hindustan Times
Description: Hindustan Times India’s Most Stylish 2023: Akshay Kumar and Raveena Tandon reunites on stage. | Bollywood
Classification: 0.4818585515022278



Title: RR vs SRH Highlights: Sunrisers Hyderabad hunt down 215 to keep playoffs hopes alive, Rajasthan Royals lo - Times of India
Description: Cricket News: A re-jigged batting order fired in unison as Sunrisers Hyderabad stunned Rajasthan Royals at their home to clinch a high-scoring last-ball IPL thrille
Classification: 0.45742982625961304



Title: 18 dead as tourist boat overturns at Tanur; five children among deceased - Onmanorama
Description: The tragedy occurred at Thooval Theeram, Ottumpuram, a popular tourist destination in Malappuram.
Classification: 0.49380818009376526



Title: Mohammed Siraj, Phil Salt Bury The Hatchet With Brilliant Post-Match Gesture - NDTV Sports
Description: Delhi Capitals registered their third win of IPL 2023 on Saturday after they comfortably defeated Royal Challengers Bangalore by seven wickets
Classification: 0.4774373173713684



Title: Only Women Contingents Likely To Participate In Next Year's Republic Day Parade - Times Now
Description: A memorandum sent to the three services and various ministries and departments by the Defence Ministry says that the Republic Day Parade 2024 will have only women participants in the contingents (marching and band), tableaux and other performances.
Classification: 0.7029017210006714



Title: Viral Videos: Thousands Evacuated As "Unprecedented" Wildfires Ravage Canada - NDTV
Description: Videos going viral on social media show the massive scale of unprecedented wildfires burning in Canada, where thousands of people have been forced to evacuate their homes.
Classification: 0.583849310874939



Title: Congress openly arguing for Karnataka’s secession: PM Modi steps up attack in last leg of poll campaign - The Indian Express
Description: Secretly meeting diplomats who do not like India, tukde tukde gang disease high in Congress, says PM
Classification: 0.47877347469329834



Title: What has spurred ethnic violence in India’s Manipur? - Al Jazeera English
Description: Tribal groups are protesting the prospect of Manipur’s majority Meitei community being recognised as “Scheduled Tribe”.
Classification: 0.4819115996360779



Title: Watch: Wriddhiman Saha`s Trousers Take Center Stage In Hilarious IPL Moment, Hardik Pandya And Mohammed Sha... - Zee News
Description: Pandya vs Pandya: Brotherly Showdown In IPL 2023, 7 Famous Brother Duos Who Played With And Against Each Other In IPLs History - In Pics During his brief time on the field, Sahas trousers were noticed to be the wrong way around, causing laughter among Hardik …
Classification: 0.7439875602722168



Title: PM Modi to Asaduddin Owaisi, this week's top 5 newsmakers - Hindustan Times
Description: Here are the list of top 5 newsmakers this week. | Latest News India
Classification: 0.32230761647224426



Title: 'Gill was getting tired. It'll sound controversial...retire him out': Doull - Hindustan Times
Description: On Sunday, Doull reiterated his milestone theory in a fresh jibe targetting Shubman Gill, who scored 94 runs in the match against Lucknow Super Giants. | Cricket
Classification: 0.9087792634963989



Title: Paytm focused on reaching financial milestone 'in near future': Vijay Shekhar Sharma - Economic Times
Description: Positive free cash flow is when a company has sufficient funds to invest back into the business for growth.
Classification: 0.3781239092350006





Title: Diabetes-Friendly Weight Loss Diets: Try These 2 Diets - Boldsky
Description: Diabetes is a serious condition that can lead to a variety of health problems - one of which is weight gain. While it is important to maintain a healthy weight, it can be difficult for those with diabetes to lose weight – however, we are here to help you out …
Classification: 0.7438589930534363



Title: Viral video shows ‘Grim Reaper’ at King Charles’ Coronation - Hindustan Times
Description: At the Coronation ceremony of King Charles III, a spooky figure was caught on camera and videos of the same have been going crazy viral online. | Trending
Classification: 0.38068220019340515



Title: It's never too late to prioritise your health say experts - Times of India
Description: “The irony of our society is that we prioritise our health only once it starts deteriorating,” shares fitness trainer and nutritionist Diksha Chhabra.
Classification: 0.656067967414856



Title: All about LIGO-India project, which has put country on elite astronomy map - The Federal
Description: What is the LIGO-India project for which the Centre has approved Rs 2,600 crore? When will it start operating and why is it important? Here are your questions answered.
Classification: 0.45994916558265686

