# LangChain Data Loader

```shell
pip install langchain-community beautifulsoup4
```

In [1]:
from langchain_openai import ChatOpenAI
from langchain_ollama.chat_models import ChatOllama
from os import getenv
from dotenv import load_dotenv

load_dotenv()

llm = ChatOpenAI(
    openai_api_key=getenv("OPENROUTER_API_KEY"),
    openai_api_base="https://openrouter.ai/api/v1",
    model="meta-llama/llama-3.2-3b-instruct:free",
    temperature=0.5,
    # max_tokens=512,

)
# llm = ChatOllama(model='qwen2.5:0.5b', temperature=0.5, max_tokens=512)

result = llm.invoke("Hello, how are you today?")
print(result.content)

I'm just a language model, so I don't have emotions or feelings like humans do, but I'm functioning properly and ready to help you with any questions or tasks you have. How can I assist you today?


# CSV Data Loader



In [8]:
from langchain.document_loaders import CSVLoader
# https://support.staffbase.com/hc/en-us/article_attachments/360009197031/username.csv
loader = CSVLoader('data/sample.csv')

data = loader.load()

print(type(data))

print(data[0])

print(data[1].page_content)

<class 'list'>
page_content='Username; Identifier;First name;Last name: booker12;9012;Rachel;Booker' metadata={'source': 'data/sample.csv', 'row': 0}
Username; Identifier;First name;Last name: grey07;2070;Laura;Grey


# Web Loaders
## HTML Data Loader
``` shell
pip install beautifulsoup4
```

In [14]:
from langchain.document_loaders import BSHTMLLoader
from pprint import pp, pprint
# http://help.websiteos.com/websiteos/example_of_a_simple_html_page.htm

loader = BSHTMLLoader('data/sample.html')

data = loader.load()

print(type(data))

print(data)

print(data[0].page_content)

<class 'list'>
[Document(metadata={'source': 'data/sample.html', 'title': 'HTML Element Selection Example'}, page_content='\n\n\n\nHTML Element Selection Example\n\n\n\n\nHTML Element Selection Demo\n\n\nSection 1\nSection 2\nSection 3\n\n\n\n\n\nSection 1\nThis is a highlighted paragraph.\nClick Me\n\n\nSection 2\n\nItem 1\nItem 2\nItem 3\n\n\nSubmit\n\n\nSection 3\n\nBox 1\nBox 2\nBox 3\n\n\n\n\nCreated by Your Name. Follow me on Twitter.\n\n\n')]




HTML Element Selection Example




HTML Element Selection Demo


Section 1
Section 2
Section 3





Section 1
This is a highlighted paragraph.
Click Me


Section 2

Item 1
Item 2
Item 3


Submit


Section 3

Box 1
Box 2
Box 3




Created by Your Name. Follow me on Twitter.





# PDF Data Loader
## PyPDF Data Loader
``` shell
pip install pypdf
```

In [21]:
from langchain.document_loaders import PyPDFLoader

loader = PyPDFLoader('data/constitution.pdf')

data = loader.load()


print(type(data))

# print(data)






<class 'list'>


## PyPDFDirectoryLoader Data Loader



In [None]:
from langchain_community.document_loaders import PyPDFDirectoryLoader


## PDFMinerLoader

In [None]:
from langchain_community.document_loaders import PDFMinerLoader


## PyMuPDFLoader

In [None]:
from langchain_community.document_loaders import PyMuPDFLoader


## PDFPlumberLoader

In [None]:
from langchain_community.document_loaders import PDFPlumberLoader
