In [24]:
from langchain_text_splitters import RecursiveCharacterTextSplitter
import wikipediaapi
import google.generativeai as genai
import PyPDF2
from langchain_community.document_loaders import WebBaseLoader
import requests
from bs4 import BeautifulSoup
from langchain.llms import Ollama
from langchain_community.embeddings import OllamaEmbeddings
from langchain_chroma import Chroma
import dotenv

In [25]:
api_key = dotenv.get_key(".env" , key_to_get="GEMINI_API_KEY")
genai.configure(api_key=api_key)

In [26]:
gen_config = genai.GenerationConfig(temperature=0.4)
model = genai.GenerativeModel( "models/gemini-1.5-flash" , generation_config=gen_config )

In [33]:
weburl = "https://www.gov.uk/government/publications/research-on-the-cyber-security-of-ai/ai-cyber-security-survey-main-report"
loader = WebBaseLoader(weburl)
loader.requests_kwargs = {'verify':False}
data = loader.load()



In [34]:
data = str(data)

In [36]:
data

"[Document(page_content='\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n      AI cyber security survey - main report  - GOV.UK\\n  \\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\nCookies on GOV.UK\\n\\nWe use some essential cookies to make this website work.\\nWe’d like to set additional cookies to understand how you use GOV.UK, remember your settings and improve government services.\\nWe also use cookies set by other sites to help us deliver content from their services.\\nYou have accepted additional cookies. You can change your cookie settings at any time.\\nYou have rejected additional cookies. You can change your cookie settings at any time.\\n\\n\\n\\n\\nAccept additional cookies\\nReject additional cookies\\nView cookies\\n\\n\\n\\n          Hide this message\\n        \\n\\n\\n\\nSkip to main content\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n \\n\\n\\n                GOV.UK\\n              \\n\\n\\n \\n\\n\\n  

In [35]:

text_splitter = RecursiveCharacterTextSplitter(
    chunk_size=100000, 
    chunk_overlap=30,
    separators=['.','\n','\n\n']
)

In [30]:
texts = text_splitter.split_text(data)

In [31]:
texts

["[Document(page_content='\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n      AI cyber security survey - main report  - GOV.UK\\n  \\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\nCookies on GOV.UK\\n\\nWe use some essential cookies to make this website work.\\nWe’d like to set additional cookies to understand how you use GOV.UK, remember your settings and improve government services.\\nWe also use cookies set by other sites to help us deliver content from their services.\\nYou have accepted additional cookies. You can change your cookie settings at any time.\\nYou have rejected additional cookies. You can change your cookie settings at any time.\\n\\n\\n\\n\\nAccept additional cookies\\nReject additional cookies\\nView cookies\\n\\n\\n\\n          Hide this message\\n        \\n\\n\\n\\nSkip to main content\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n\\n \\n\\n\\n                GOV.UK\\n              \\n\\n\\n \\n\\n\\n 

In [32]:
summarized_content = " "
for text in texts:
    response = model.generate_content(
        f"""You are a cyber security expert and an expert summarizer. The given text is from a website. Summarize in bulletin points.
        {text}
        """
    )
    summarized_content += response.text
    print(response.text)

## AI Cyber Security Survey - Main Report Summary

**1. Executive Summary:**

**(i) Purpose:** The survey, commissioned by the Department for Science, Innovation and Technology (DSIT), aimed to understand AI usage and cyber security practices in UK businesses.

**(ii) Methodology:** 350 interviews were conducted with businesses using or considering AI across nine sectors using Computer Assisted Telephone Interviewing (CATI).

**(iii) Key Findings:**

* **AI Adoption:** 
    * 68% of businesses are currently using AI, with 38% using natural language processing and generation.
    * Over half of businesses have been using AI for at least a year, with 52% using machine learning for over 3 years.
    * Most AI technologies are adopted through purchasing external software or ready-to-use systems.
* **Cyber Security Practices:**
    * Nearly half of businesses using AI (47%) have no specific cyber security practices in place for AI.
    * 39% of businesses don't expect specific cyber securit