# In [None]:
from llama_index.readers.web import SimpleWebPageReader
from llama_index.core import VectorStoreIndex
from llama_index.llms.huggingface import HuggingFaceLLM
from dotenv import load_dotenv

# Load settings from a local .env file into the process environment
# (python-dotenv); presumably API keys/tokens used by the libraries below.
load_dotenv()

# Web page that is passed to reader() at the bottom of this cell.
url = "https://en.wikipedia.org/wiki/Myocardial_infarction"

def reader(urls: "str | list[str]") -> None:
    """Index the given web page(s) and print the answer to a fixed question.

    The pages are fetched with ``SimpleWebPageReader`` (HTML converted to
    text), indexed with ``VectorStoreIndex``, and queried through a
    ``HuggingFaceLLM`` running ``HuggingFaceH4/zephyr-7b-beta``. The response
    is printed to stdout; nothing is returned.

    Args:
        urls: A single URL string, or a list (any iterable) of URL strings.

    Raises:
        ValueError: If the web reader returns no documents.
    """
    # Honour the argument: the earlier version ignored ``urls`` and always
    # read the module-level ``url`` global instead.
    url_list = [urls] if isinstance(urls, str) else list(urls)

    documents = SimpleWebPageReader(html_to_text=True).load_data(urls=url_list)

    # Report how much was loaded before failing, so an empty result is visible.
    print(f"Loaded {len(documents)} documents")
    if not documents:
        raise ValueError("No data was loaded. Check the URL or network connection.")

    # NOTE: no messages_to_prompt / completion_to_prompt callables are passed,
    # so whatever prompt formatting the library applies by default is used.
    llm = HuggingFaceLLM(
        model_name="HuggingFaceH4/zephyr-7b-beta",
        tokenizer_name="HuggingFaceH4/zephyr-7b-beta",
        context_window=3900,
        max_new_tokens=256,
        generate_kwargs={"temperature": 0.7, "top_k": 50, "top_p": 0.95},
        device_map="auto",
    )

    # NOTE(review): the index is built without an explicit embedding model, so
    # presumably llama_index's globally configured one is used -- confirm it
    # is set up (credentials/model) in this environment.
    index = VectorStoreIndex.from_documents(documents=documents)
    query_engine = index.as_query_engine(llm=llm)

    response = query_engine.query("What is the best immediate treatment for myocardial infarction?")
    print(response)

# Run the load -> index -> query pipeline for the page defined in `url`.
reader(url)
