In [1]:
from langchain.text_splitter import RecursiveCharacterTextSplitter # Import the specific text splitter

In [2]:
# Sample document for the splitting demo. 📄
# Two paragraphs about space exploration separated by one blank line. The
# value starts and ends with a newline, so it is character-for-character what
# a triple-quoted literal opened and closed on its own lines would contain.
text = (
    "\n"
    "Space exploration has led to incredible scientific discoveries. From landing on the Moon to exploring Mars, humanity continues to push the boundaries of what’s possible beyond our planet."
    "\n\n"
    "These missions have not only expanded our knowledge of the universe but have also contributed to advancements in technology here on Earth. Satellite communications, GPS, and even certain medical imaging techniques trace their roots back to innovations driven by space programs."
    "\n"
)

In [3]:
# Build the splitter used by the remaining cells. ✂️
# RecursiveCharacterTextSplitter works through a list of separator characters
# recursively, aiming to keep related text together in the same chunk.
#
#   chunk_overlap=0 -> nothing is repeated between consecutive chunks; a
#                      non-zero value would carry context across boundaries.
#   chunk_size=500  -> upper bound on the size of each chunk (measured in
#                      characters, assuming the default length function).
splitter = RecursiveCharacterTextSplitter(chunk_overlap=0, chunk_size=500)

In [4]:
# Split the sample text into chunks. 📝
# `split_text` takes the raw string and returns a list of strings; the result
# is bound to `chunks` for the inspection cells that follow.
chunks = splitter.split_text(text)

In [5]:
# Report how many chunks the splitter produced. 📏
# The sample text is shorter than the configured chunk_size of 500, so the
# recorded run yields a single chunk.
print(len(chunks))

1


In [6]:
# Show the chunks themselves. 📊
# This prints the list object, so the output is its repr: one bracketed line
# with each chunk quoted and newlines shown as "\n", not one chunk per line.
print(chunks)

['Space exploration has led to incredible scientific discoveries. From landing on the Moon to exploring Mars, humanity continues to push the boundaries of what’s possible beyond our planet.\n\nThese missions have not only expanded our knowledge of the universe but have also contributed to advancements in technology here on Earth. Satellite communications, GPS, and even certain medical imaging techniques trace their roots back to innovations driven by space programs.']
