Example gotten from
https://docs.llamaindex.ai/en/stable/getting_started/starter_example/

In [2]:
import os
import os.path
from llama_index.core import (
    VectorStoreIndex,
    SimpleDirectoryReader,
    StorageContext,
    load_index_from_storage,
)

## Index: Creating-Persisting or Loading
This uses `gpt-3.5-turbo` by default.

In [3]:
persist_dir = os.path.join(os.environ["PERSIST_DIR"], "paul_small")
if not os.path.exists((os.environ["PERSIST_DIR"]):
    # load the documents and create the index
    documents = SimpleDirectoryReader("data").load_data()
    index = VectorStoreIndex.from_documents(documents)
    # store it for later
    index.storage_context.persist(persist_dir=PERSIST_DIR)
else:
    # load the existing index
    storage_context = StorageContext.from_defaults(persist_dir=PERSIST_DIR)
    index = load_index_from_storage(storage_context)

In [7]:
persist_dir = os.path.join(os.environ["WORKDIR"], "persist_dir")
index.storage_context.persist(persist_dir)

DEBUG:fsspec.local:open file: /llamaindex-project/persist_dir/docstore.json
open file: /llamaindex-project/persist_dir/docstore.json
DEBUG:fsspec.local:open file: /llamaindex-project/persist_dir/index_store.json
open file: /llamaindex-project/persist_dir/index_store.json
DEBUG:fsspec.local:open file: /llamaindex-project/persist_dir/graph_store.json
open file: /llamaindex-project/persist_dir/graph_store.json
DEBUG:fsspec.local:open file: /llamaindex-project/persist_dir/default__vector_store.json
open file: /llamaindex-project/persist_dir/default__vector_store.json
DEBUG:fsspec.local:open file: /llamaindex-project/persist_dir/image__vector_store.json
open file: /llamaindex-project/persist_dir/image__vector_store.json


## Query your data

In [4]:
query_engine = index.as_query_engine()
response = query_engine.query("What programming language he used in college?")
print(response)

Fortran


## Logging for viewing events and queries

In [5]:
import logging
import sys

logging.basicConfig(stream=sys.stdout, level=logging.DEBUG)
logging.getLogger().addHandler(logging.StreamHandler(stream=sys.stdout))

In [6]:
query_engine = index.as_query_engine()
response = query_engine.query("What programming language he used in college?")
print(response)

DEBUG:openai._base_client:Request options: {'method': 'post', 'url': '/embeddings', 'files': None, 'post_parser': <function Embeddings.create.<locals>.parser at 0x7fff2373ba60>, 'json_data': {'input': ['What programming language he used in college?'], 'model': 'text-embedding-ada-002', 'encoding_format': 'base64'}}
Request options: {'method': 'post', 'url': '/embeddings', 'files': None, 'post_parser': <function Embeddings.create.<locals>.parser at 0x7fff2373ba60>, 'json_data': {'input': ['What programming language he used in college?'], 'model': 'text-embedding-ada-002', 'encoding_format': 'base64'}}
DEBUG:httpcore.connection:close.started
close.started
DEBUG:httpcore.connection:close.complete
close.complete
DEBUG:httpcore.connection:connect_tcp.started host='api.openai.com' port=443 local_address=None timeout=60.0 socket_options=None
connect_tcp.started host='api.openai.com' port=443 local_address=None timeout=60.0 socket_options=None
DEBUG:httpcore.connection:connect_tcp.complete ret