In [1]:
from IPython.display import clear_output

In [2]:
!pip install langchain deeplake langchain_mistralai tiktoken newspaper3k requests
clear_output()
!pip list

Package                          Version
-------------------------------- ---------------------
absl-py                          1.4.0
accelerate                       0.32.1
aioboto3                         13.1.1
aiobotocore                      2.13.1
aiofiles                         24.1.0
aiohappyeyeballs                 2.4.0
aiohttp                          3.10.5
aioitertools                     0.11.0
aiosignal                        1.3.1
alabaster                        0.7.16
albucore                         0.0.13
albumentations                   1.4.14
altair                           4.2.2
annotated-types                  0.7.0
anyio                            3.7.1
argon2-cffi                      23.1.0
argon2-cffi-bindings             21.2.0
array_record                     0.5.1
arviz                            0.18.0
asn1crypto                       1.5.1
astropy                          6.1.2
astropy-iers-data                0.2024.8.19.0.32.16
astunparse          

In [3]:
import json
import os
from google.colab import userdata

# LangSmith tracing settings that are plain constants.
os.environ['LANGCHAIN_TRACING_V2'] = 'true'
os.environ['LANGCHAIN_ENDPOINT'] = 'https://api.smith.langchain.com'

# Environment variable -> name of the Colab secret that supplies its value.
_ENV_TO_SECRET = (
    ('LANGCHAIN_API_KEY', 'LANGCHAIN_API_KEY'),
    ("MISTRAL_API_KEY", 'MISTRAL_API'),
    ("HUGGINGFACEHUB_API_TOKEN", 'HF_TOKEN'),
    ("ACTIVELOOP_TOKEN", 'ACTIVELOOP_API'),
    # ("GOOGLE_API_KEY", 'GOOGLE_KEY'),
    # ("GOOGLE_CSE_ID", 'GOOGLE_CSE_ID'),
)

# Copy each secret into the process environment, in the order listed above.
for _env_name, _secret_name in _ENV_TO_SECRET:
    os.environ[_env_name] = userdata.get(_secret_name)

In [5]:
import requests
from newspaper import Article

# Browser-like User-Agent sent with the page request.
headers = {
    'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/89.0.4389.82 Safari/537.36'
}

article_url = "https://www.artificialintelligence-news.com/2022/01/25/meta-claims-new-ai-supercomputer-will-set-records/"

try:
    # The context manager releases the session's connections once the page
    # has been fetched; the response body is already loaded at that point.
    with requests.Session() as session:
        response = session.get(article_url, headers=headers, timeout=10)

    if response.status_code == 200:
        article = Article(article_url)
        # Give newspaper the HTML fetched above instead of letting it request
        # the page a second time without the custom headers and timeout.
        article.download(input_html=response.text)
        article.parse()

        print(f"Title: {article.title}")
        print(f"Text: {article.text}")
    else:
        print(f"Failed to fetch article at {article_url}")
except Exception as e:
    # Best-effort cell: report the failure instead of stopping the notebook.
    # Later cells read `article`, so they will fail if this branch is taken.
    print(f"Error occurred while fetching article at {article_url}: {e}")


Title: Meta claims its new AI supercomputer will set records
Text: Ryan Daws is a senior editor at TechForge Media with over a decade of experience in crafting compelling narratives and making complex topics accessible. His articles and interviews with industry leaders have earned him recognition as a key influencer by organisations like Onalytica. Under his leadership, publications have been praised by analyst firms such as Forrester for their excellence and performance. Connect with him on X (@gadget_ry) or Mastodon (@gadgetry@techhub.social)

Meta (formerly Facebook) has unveiled an AI supercomputer that it claims will be the world’s fastest.

The supercomputer is called the AI Research SuperCluster (RSC) and is yet to be fully complete. However, Meta’s researchers have already begun using it for training large natural language processing (NLP) and computer vision models.

RSC is set to be fully built in mid-2022. Meta says that it will be the fastest in the world once complete and 

In [6]:
from langchain.schema import HumanMessage

# Pull the two fields of the parsed article that fill the prompt placeholders.
article_title, article_text = article.title, article.text

# Prompt asking for a free-form summary; the article sits between the rulers.
template = """You are a very good assistant that summarizes online articles.

Here's the article you want to summarize.

==================
Title: {article_title}

{article_text}
==================

Write a summary of the previous article.
"""

# Fill the placeholders and wrap the result as a single human message.
prompt = template.format(
    article_title=article_title,
    article_text=article_text,
)
messages = [HumanMessage(content=prompt)]

In [7]:
from langchain_mistralai import ChatMistralAI

# Chat model client used by every summarization cell below. Only the
# temperature is set here; all other options are left at the library defaults.
# NOTE(review): presumably authenticates via the MISTRAL_API_KEY environment
# variable set earlier in the notebook — confirm against langchain_mistralai.
chat = ChatMistralAI(temperature=0)

In [11]:
# Send the current `messages` list to the chat model and keep its reply.
summary = chat.invoke(messages)
# Bare last expression so the notebook displays the reply's text.
summary.content

"Meta, formerly Facebook, has announced its new AI supercomputer, the AI Research SuperCluster (RSC), which it claims will be the world's fastest once completed in mid-2022. The supercomputer is currently being used to train large NLP and computer vision models. Meta aims for RSC to be capable of training models with trillions of parameters, which will enable real-time voice translations for large groups of people speaking different languages. The supercomputer is expected to be 20x faster than Meta's current V100-based clusters and will allow Meta to use real-world examples from its production systems for training, improving tasks such as identifying harmful content on its platforms. RSC has been designed with security and privacy controls in mind, and Meta believes it is the first time performance, reliability, security, and privacy have been tackled at such a scale. The supercomputer will support Meta's development of the metaverse, where AI-driven applications and products will pla

In [13]:
# Prompt variant that asks for the summary as a bulleted list.
template = """You are an advanced AI assistant that summarizes online articles into bulleted lists.

Here's the article you need to summarize.

==================
Title: {article_title}

{article_text}
==================

Now, provide a summarized version of the article in a bulleted list format.
"""

# Substitute the parsed article's fields, then wrap the prompt as one human message.
prompt = template.format_map(
    {"article_title": article.title, "article_text": article.text}
)
messages = [HumanMessage(content=prompt)]

In [14]:
# Send the bulleted-list prompt to the chat model and keep its reply.
summary = chat.invoke(messages)
# print() instead of a bare expression: the bare form shows the string's repr,
# where every line break appears as a literal "\n" and the bullets run together.
print(summary.content)

"- Meta, formerly Facebook, has announced its new AI supercomputer, the AI Research SuperCluster (RSC).\n- The RSC is currently being used for training large NLP and computer vision models, with completion expected in mid-2022.\n- Meta claims that the RSC will be the world's fastest AI supercomputer once completed, capable of training models with trillions of parameters.\n- The RSC is expected to be 20x faster than Meta's current V100-based clusters for production and 3x faster for training large-scale NLP workflows.\n- With RSC, a model with tens of billions of parameters can finish training in three weeks compared to nine weeks previously.\n- RSC is designed with security and privacy controls in mind, allowing Meta to use real-world examples from its production systems for training, improving tasks such as identifying harmful content.\n- This is the first time performance, reliability, security, and privacy have been addressed at such a scale, according to Meta.\n- The RSC will help 

In [15]:
# Prompt variant that asks for the bulleted summary to be written in French.
template = """You are an advanced AI assistant that summarizes online articles into bulleted lists.

Here's the article you need to summarize.

==================
Title: {article_title}

{article_text}
==================

Now, provide a summarized version of the article in a bulleted list format, in French.
"""

# Fill both placeholders from the parsed article and wrap as one human message.
prompt = template.format(
    article_title=article.title,
    article_text=article.text,
)
messages = [
    HumanMessage(content=prompt),
]

In [16]:
# Send the French bulleted-list prompt to the chat model and keep its reply.
summary = chat.invoke(messages)
# print() instead of a bare expression: the bare form shows the string's repr,
# where every line break appears as a literal "\n" and the bullets run together.
print(summary.content)

"- Ryan Daws, rédacteur en chef de TechForge Media, a annoncé que Meta (anciennement Facebook) a dévoilé un superordinateur d'intelligence artificielle (IA) appelé AI Research SuperCluster (RSC).\n- RSC est en cours de construction et sera, selon Meta, le superordinateur le plus rapide du monde une fois achevé mi-2"