In [9]:
# One-time setup: uncomment to install the scraping dependencies
# (presumably what SeleniumURLLoader needs at load time — confirm before relying on it).
#!pip install unstructured selenium

In [19]:
from langchain.text_splitter import CharacterTextSplitter
from langchain.document_loaders import SeleniumURLLoader
from langchain import PromptTemplate
from langchain import LLMChain, PromptTemplate
#from langchain_openai import ChatOpenAI
from langchain.llms import Ollama
from langchain_community.embeddings import OllamaEmbeddings
from langchain_community.vectorstores import FAISS



In [None]:
# Source articles for the knowledge base.
# Each URL is listed exactly once so no page is scraped, chunked and embedded
# twice (duplicates would show up as repeated hits in similarity search).
urls = [
    'https://beebom.com/what-is-nft-explained/',
    'https://beebom.com/how-delete-spotify-account/',
    'https://beebom.com/how-download-gif-twitter/',
    'https://beebom.com/how-use-chatgpt-linux-terminal/',
    'https://beebom.com/how-save-instagram-story-with-music/',
    'https://beebom.com/how-install-pip-windows/',
    'https://beebom.com/how-check-disk-usage-linux/',
]

In [7]:
# Fetch every article through the Selenium-backed loader.
loader = SeleniumURLLoader(urls=urls)
docs_not_splitted = loader.load()

# Break the loaded articles into chunks targeting 1000 characters, with no
# overlap between neighbouring chunks.
text_splitter = CharacterTextSplitter(chunk_overlap=0, chunk_size=1000)
docs = text_splitter.split_documents(documents=docs_not_splitted)



Created a chunk of size 1226, which is longer than the specified 1000


In [12]:
# Select the embedding model served by Ollama.
embeddings = OllamaEmbeddings(model="mxbai-embed-large")

# Build the FAISS vector store from the chunked documents.
db = FAISS.from_documents(documents=docs, embedding=embeddings)


In [13]:
# Sanity-check retrieval: print the best-matching chunk for a sample question.
# The hits are stored under their own name so that `docs` (the chunk list the
# FAISS index is built from) is not overwritten; otherwise re-running the
# indexing cell would silently index only these few search results.
query = "how to check disk usage in linux?"
top_docs = db.similarity_search(query)
print(top_docs[0].page_content)


Home > Tech > How to Check Disk Usage in Linux (4 Methods)

How to Check Disk Usage in Linux (4 Methods)

Beebom Staff

Comments							
							
								0

Share

Copied

There may be times when you need to download some important files or transfer some photos to your Linux system, but face a problem of insufficient disk space. You head over to your file manager to delete the large files which you no longer require, but you have no clue which of them are occupying most of your disk space. In this article, we will show some easy methods to check disk usage in Linux from both the terminal and the GUI application.

Table of Contents

Display Disk Usage in Human Readable Format

Display Disk Occupancy of a Particular Type

Display Disk Usage in Human Readable Format

Display Disk Usage for a Particular Directory

Compare Disk Usage of Two Directories

Sorting Files based on File Size

Exclude Files Based on Their File Size

Exclude Files Based on their Types


In [14]:
# Prompt for a customer-support chatbot that answers questions using only the
# context retrieved from our vector store.
# Placeholders:
#   {chunks_formatted} - the retrieved chunks joined into one context string
#   {query}            - the customer's question
# The question and the "Answer:" cue sit on separate lines so the rendered
# prompt does not run them together (e.g. "...linux?Answer:").

template = """You are an exceptional customer support chatbot that gently answer questions.
              You know the following context information.
              
              {chunks_formatted} 
              
              Answer to the following question from a customer. 
              Use only information from the previous context information. Do not invent stuff.

              Question: {query}
              Answer:"""

# Wrap the raw template string, declaring the two placeholders it contains.
prompt = PromptTemplate(
    template=template,
    input_variables=["chunks_formatted", "query"],
)




In [15]:
# The full pipeline: question -> retrieval -> formatted prompt.

# user question
query = "How to check disk usage in linux?"

# Retrieve relevant chunks. The hits are kept under their own name so `docs`
# (the chunk list the FAISS index is built from) is not overwritten and the
# indexing cell stays safe to re-run.
retrieved_docs = db.similarity_search(query)
retrieved_chunks = [doc.page_content for doc in retrieved_docs]

# Format the prompt: chunks are separated by a blank line inside the context.
chunks_formatted = "\n\n".join(retrieved_chunks)
prompt_formatted = prompt.format(chunks_formatted=chunks_formatted, query=query)

In [23]:
# Set up the Ollama-served chat model that will answer from the prompt.
llm = Ollama(temperature=0, model="llama3:latest")

In [24]:
# Send the fully formatted prompt to the model and show its reply.
res = llm.invoke(input=prompt_formatted)
print(res)

According to the article, there are several methods to check disk usage in Linux. Here are four ways:

1. **Display Disk Usage in Human Readable Format**: You can use the `du` command with the `-h` flag to display the sizes in human-readable format like megabytes, gigabytes, etc.

Example: `du -h`

2. **Display Disk Occupancy of a Particular Type**: You can use the `df` command with options such as `-a`, `-h`, `-t`, or `-x` to display the disk usage of only the file system of a particular type.

Example: `df -h`

3. **Display Disk Usage for a Particular Directory**: You can use the `du` command with the `-s` flag and specify the directory name to view the disk usage for that specific folder.

Example: `du -s -h <directory_name>`

4. **Compare Disk Usage of Two Directories**: You can use the `du` command with multiple directory names to compare the disk usage of two or more directories.

Example: `du <options> <directory_1> <directory_2>`

Additionally, you can also check disk usage usi