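# Semantic split

Split text into chunks based on the embedding similarity of neighbouring sentences, using LangChain's `SemanticChunker` with a sentence-transformers model.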


In [36]:
from langchain_experimental.text_splitter import SemanticChunker
from langchain_huggingface import HuggingFaceEmbeddings

# Embedding backend: the all-MiniLM-L6-v2 sentence-transformers model.
embeddings = HuggingFaceEmbeddings(model_name="sentence-transformers/all-MiniLM-L6-v2")

# Semantic splitter driven by the embeddings above. Breakpoints use the
# "standard_deviation" rule with an amount of 0.2.
# NOTE(review): a low amount presumably yields more, smaller chunks — confirm
# against the SemanticChunker documentation before tuning.
text_splitter = SemanticChunker(
    embeddings=embeddings,
    breakpoint_threshold_amount=0.2,
    breakpoint_threshold_type="standard_deviation",
)

In [37]:
# Demo text that mixes unrelated topics (farming, cricket, space) so that
# the splitter has topic changes to find.
sample = """
Farmers were working hard in the fields, preparing the soil and planting seeds for the next season. The sun was bright, and the air smelled of earth and fresh grass. The Indian Premier League (IPL) is the biggest cricket league in the world. People all over the world watch the matches and cheer for their favourite teams.

Space is very important for us. It helps us understand our place in the universe and how we can explore it. The moon is a fascinating celestial body that has captivated human imagination for centuries. It is the Earth's only natural satellite and has a significant impact on our planet, influencing tides and providing light at night. 

"""

# Run the semantic splitter over the single sample text; the result is a
# list of Document objects, one per chunk.
docs = text_splitter.create_documents(texts=[sample])



In [38]:
# Number of chunks the splitter produced for the sample text.
len(docs)

4

In [39]:
# Display the chunk list to inspect each Document's metadata and page_content.
docs

[Document(metadata={}, page_content='\nFarmers were working hard in the fields, preparing the soil and planting seeds for the next season.'),
 Document(metadata={}, page_content='The sun was bright, and the air smelled of earth and fresh grass. The Indian Premier League (IPL) is the biggest cricket league in the world. People all over the world watch the matches and cheer for their favourite teams.'),
 Document(metadata={}, page_content='Space is very important for us.'),
 Document(metadata={}, page_content="It helps us understand our place in the universe and how we can explore it. The moon is a fascinating celestial body that has captivated human imagination for centuries. It is the Earth's only natural satellite and has a significant impact on our planet, influencing tides and providing light at night. ")]

In [40]:
# Print only the text of each chunk, one chunk per line, so the split
# points are easy to read.
for chunk in docs:
    print(chunk.page_content)


Farmers were working hard in the fields, preparing the soil and planting seeds for the next season.
The sun was bright, and the air smelled of earth and fresh grass. The Indian Premier League (IPL) is the biggest cricket league in the world. People all over the world watch the matches and cheer for their favourite teams.
Space is very important for us.
It helps us understand our place in the universe and how we can explore it. The moon is a fascinating celestial body that has captivated human imagination for centuries. It is the Earth's only natural satellite and has a significant impact on our planet, influencing tides and providing light at night. 
