In [18]:
from langchain import PromptTemplate, LLMChain
from langchain.llms import LlamaCpp
from langchain.callbacks.manager import CallbackManager
from langchain.callbacks.streaming_stdout import StreamingStdOutCallbackHandler

In [19]:
# Callbacks support token-wise streaming
callback_manager = CallbackManager([StreamingStdOutCallbackHandler()])
# Verbose is required to pass to the callback manager

In [20]:
model_path = "../../../../../Models/llama-2-7b-chat.ggmlv3.q8_0.bin"

In [21]:
n_gpu_layers = 40  # Change this value based on your model and your GPU VRAM pool.
n_batch = 512  # Should be between 1 and n_ctx, consider the amount of VRAM in your GPU.
# Make sure the model path is correct for your system!
llm = LlamaCpp(
    model_path=model_path,
    n_gpu_layers=n_gpu_layers,
    n_batch=n_batch,
    input={"temperature": 0.75, "max_length": 2000, "top_p": 1},
    callback_manager=callback_manager,
    verbose=True,
)

llama.cpp: loading model from ../../../../../Models/llama-2-7b-chat.ggmlv3.q8_0.bin
llama_model_load_internal: format     = ggjt v3 (latest)
llama_model_load_internal: n_vocab    = 32000
llama_model_load_internal: n_ctx      = 512
llama_model_load_internal: n_embd     = 4096
llama_model_load_internal: n_mult     = 256
llama_model_load_internal: n_head     = 32
llama_model_load_internal: n_head_kv  = 32
llama_model_load_internal: n_layer    = 32
llama_model_load_internal: n_rot      = 128
llama_model_load_internal: n_gqa      = 1
llama_model_load_internal: rnorm_eps  = 1.0e-06
llama_model_load_internal: n_ff       = 11008
llama_model_load_internal: freq_base  = 10000.0
llama_model_load_internal: freq_scale = 1
llama_model_load_internal: ftype      = 7 (mostly Q8_0)
llama_model_load_internal: model size = 7B
llama_model_load_internal: ggml ctx size =    0.08 MB
llama_model_load_internal: mem required  = 7130.73 MB (+  256.00 MB per state)
llama_new_context_with_model: kv self size  =  25

In [22]:
template = """Question: {question}

Answer: Let's work this out in a step by step way to be sure we have the right answer."""

prompt = PromptTemplate(template=template, input_variables=["question"])

In [23]:
llm_chain = LLMChain(prompt=prompt, llm=llm)

In [24]:
question = "What is AI Safety?"

llm_chain.run(question)

 Here is how I will break down the question, "What is AI safety?" and explain it to you:
Step 1: Definition of Artificial Intelligence (AI)
* AI is a broader field that encompasses machine learning, natural language processing, computer vision, robotics, and more.
* It involves creating machines or computer programs that can perform tasks that typically require human intelligence, such as understanding language, recognizing images, making decisions, and solving problems.
Step 2: Definition of AI Safety
* AI safety refers to the practices and measures taken to ensure that AI systems are designed and used in ways that minimize harm to people, society, and the environment.
* It involves designing AI systems that are transparent, explainable, and controllable, and that can be safely integrated into various applications without causing unintended consequences.
Step 3: Importance of AI Safety
* As AI becomes more advanced and integrated into various aspects of life, the potential risks assoc


llama_print_timings:        load time = 14669.39 ms
llama_print_timings:      sample time =   164.10 ms /   256 runs   (    0.64 ms per token,  1560.04 tokens per second)
llama_print_timings: prompt eval time = 14669.35 ms /    35 tokens (  419.12 ms per token,     2.39 tokens per second)
llama_print_timings:        eval time = 110119.89 ms /   255 runs   (  431.84 ms per token,     2.32 tokens per second)
llama_print_timings:       total time = 125583.66 ms


' Here is how I will break down the question, "What is AI safety?" and explain it to you:\nStep 1: Definition of Artificial Intelligence (AI)\n* AI is a broader field that encompasses machine learning, natural language processing, computer vision, robotics, and more.\n* It involves creating machines or computer programs that can perform tasks that typically require human intelligence, such as understanding language, recognizing images, making decisions, and solving problems.\nStep 2: Definition of AI Safety\n* AI safety refers to the practices and measures taken to ensure that AI systems are designed and used in ways that minimize harm to people, society, and the environment.\n* It involves designing AI systems that are transparent, explainable, and controllable, and that can be safely integrated into various applications without causing unintended consequences.\nStep 3: Importance of AI Safety\n* As AI becomes more advanced and integrated into various aspects of life, the potential ri