In [6]:
from langchain.embeddings.openai import OpenAIEmbeddings
from langchain.vectorstores import DeepLake
from langchain.text_splitter import CharacterTextSplitter
from langchain import OpenAI
from langchain.document_loaders import SeleniumURLLoader
from langchain import PromptTemplate

from dotenv import load_dotenv
load_dotenv()

True

In [3]:
# we'll use information from the following articles
urls = ['https://beebom.com/what-is-nft-explained/',
        'https://beebom.com/how-delete-spotify-account/',
        'https://beebom.com/how-download-gif-twitter/',
        'https://beebom.com/how-use-chatgpt-linux-terminal/',
        'https://beebom.com/how-delete-spotify-account/',
        'https://beebom.com/how-save-instagram-story-with-music/',
        'https://beebom.com/how-install-pip-windows/',
        'https://beebom.com/how-check-disk-usage-linux/']

In [5]:
loader = SeleniumURLLoader(urls=urls)
docs_not_splitted = loader.load()

text_splitter = CharacterTextSplitter(chunk_size=1000, chunk_overlap=0)
docs = text_splitter.split_documents(docs_not_splitted)

Created a chunk of size 1226, which is longer than the specified 1000


In [7]:
embeddings = OpenAIEmbeddings(model="text-embedding-ada-002")

my_activeloop_org_id = "blackorder"
my_activeloop_dataset_name = "customer_support_qa_bot"
dataset_path = f"hub://{my_activeloop_org_id}/{my_activeloop_dataset_name}"
db = DeepLake(dataset_path, embedding_function=embeddings)

db.add_documents(docs)

Your Deep Lake dataset has been successfully created!


|

Dataset(path='hub://blackorder/customer_support_qa_bot', tensors=['embedding', 'id', 'metadata', 'text'])

  tensor      htype       shape      dtype  compression
  -------    -------     -------    -------  ------- 
 embedding  embedding  (127, 1536)  float32   None   
    id        text      (127, 1)      str     None   
 metadata     json      (127, 1)      str     None   
   text       text      (127, 1)      str     None   


 

['f7328c40-3394-11ee-b60b-90e868539f12',
 'f7328c41-3394-11ee-98a7-90e868539f12',
 'f7328c42-3394-11ee-b082-90e868539f12',
 'f7328c43-3394-11ee-b8f9-90e868539f12',
 'f7328c44-3394-11ee-9aea-90e868539f12',
 'f7328c45-3394-11ee-8297-90e868539f12',
 'f7328c46-3394-11ee-9092-90e868539f12',
 'f7328c47-3394-11ee-bdca-90e868539f12',
 'f7328c48-3394-11ee-a0b8-90e868539f12',
 'f7328c49-3394-11ee-9f19-90e868539f12',
 'f7328c4a-3394-11ee-99ea-90e868539f12',
 'f7328c4b-3394-11ee-bac4-90e868539f12',
 'f7328c4c-3394-11ee-b229-90e868539f12',
 'f7328c4d-3394-11ee-b51c-90e868539f12',
 'f7328c4e-3394-11ee-9369-90e868539f12',
 'f7328c4f-3394-11ee-bdf0-90e868539f12',
 'f7328c50-3394-11ee-9e80-90e868539f12',
 'f7328c51-3394-11ee-96ea-90e868539f12',
 'f7328c52-3394-11ee-a556-90e868539f12',
 'f7328c53-3394-11ee-b910-90e868539f12',
 'f7328c54-3394-11ee-ba1e-90e868539f12',
 'f7328c55-3394-11ee-8dfa-90e868539f12',
 'f7328c56-3394-11ee-a04c-90e868539f12',
 'f7328c57-3394-11ee-88e9-90e868539f12',
 'f7328c58-3394-

In [8]:
query = "how to check disk usage in linux?"
docs = db.similarity_search(query)
print(docs[0].page_content)

Home  Tech  How to Check Disk Usage in Linux (4 Methods)

How to Check Disk Usage in Linux (4 Methods)

Beebom Staff

Last Updated: June 19, 2023 5:14 pm

There may be times when you need to download some important files or transfer some photos to your Linux system, but face a problem of insufficient disk space. You head over to your file manager to delete the large files which you no longer require, but you have no clue which of them are occupying most of your disk space. In this article, we will show some easy methods to check disk usage in Linux from both the terminal and the GUI application.

Monitor Disk Usage in Linux (2023)

Table of Contents

Check Disk Space Using the df Command
		
Display Disk Usage in Human Readable FormatDisplay Disk Occupancy of a Particular Type

Check Disk Usage using the du Command
		
Display Disk Usage in Human Readable FormatDisplay Disk Usage for a Particular DirectoryCompare Disk Usage of Two Directories


In [9]:
template = """You are an exceptional customer support chatbot that gently answer questions.

You know the following context information.

{chunks_formatted}

Answer to the following question from a customer. Use only information from the previous context information. Do not invent stuff.

Question: {query}

Answer:"""

prompt = PromptTemplate(
    input_variables=["chunks_formatted", "query"],
    template=template,
)

In [10]:
docs = db.similarity_search(query)
retrieved_chunks = [doc.page_content for doc in docs]

chunks_formatted = "\n\n".join(retrieved_chunks)
prompt_formatted = prompt.format(chunks_formatted=chunks_formatted, query=query)


llm = OpenAI(model="text-davinci-003", temperature=0)
answer = llm(prompt_formatted)
print(answer)

 You can check disk usage in Linux using the df command in the terminal or using the Disk Usage Analyzer Tool in the GUI. The df command will show you the current disk usage and the available disk space in Linux. The Disk Usage Analyzer Tool will show you a ring chart of the disk occupancy for all the folders and you can hover over any portion of the graph to see which folders are occupying the most disk space.
