# nous-hermes (with just prompts)

In [7]:
pip install gpt4all pdfminer.six

Note: you may need to restart the kernel to use updated packages.


In [8]:
# Install necessary packages
!pip install gpt4all pdfminer.six

# Import required libraries
import time
from gpt4all import GPT4All
from pdfminer.high_level import extract_text

# Function to load the model
def load_model(model_path):
    """Build a GPT4All model from ``model_path``, logging before and after.

    Args:
        model_path: Location of the model file; forwarded unchanged as the
            only argument to ``GPT4All``.

    Returns:
        The ``GPT4All`` instance that was constructed.
    """
    print(f"Loading model from {model_path}...")
    gpt_model = GPT4All(model_path)
    print("Model loaded.")
    return gpt_model

# Function to perform inference and measure time
def infer(model, input_text):
    """Time a single ``model.generate`` call and return the elapsed seconds.

    Args:
        model: Object exposing ``generate(prompt)``.
        input_text: Prompt string handed to ``model.generate``.

    Returns:
        float: Duration of the ``generate`` call, in seconds.
    """
    # perf_counter() is monotonic and high-resolution, so the measurement
    # cannot be skewed (or turn negative) by a system clock adjustment,
    # which is possible with time.time().
    start_time = time.perf_counter()
    model.generate(input_text)  # generated text is discarded; only latency matters here
    inference_time = time.perf_counter() - start_time
    # Only the first 20 characters of the prompt are echoed to keep the log short.
    print(f"Inference time for input '{input_text[:20]}...': {inference_time:.4f} seconds")
    return inference_time

# Benchmark prompts about the Flinders University Research Integrity Policy
# (described by the author as based on the PDF content).
# main() reads this module-level list and times one generation per entry.
complex_prompts = [
    "Explain the purpose of the Research Integrity Policy at Flinders University and how it aligns with the Australian Code for the Responsible Conduct of Research.",
    "Discuss the scope of the Research Integrity Policy at Flinders University, including who it applies to and the types of research activities it covers.",
    "Describe the principles and responsibilities outlined in the Research Integrity Policy for researchers at Flinders University. How do these principles ensure responsible research conduct?"
    
]

# Main function to execute the benchmarking
def main(model_path=r'C:\Users\Priyank\Downloads\nous-hermes-llama2-13b.Q4_0.gguf', prompts=None):
    """Benchmark the average generation latency of one local model.

    Args:
        model_path: Path to the local model file. Defaults to the location
            that was previously hard-coded in this cell.
        prompts: Iterable of prompt strings to time. When ``None``, the
            module-level ``complex_prompts`` list is used.

    Returns:
        None. Per-prompt timings are printed by ``infer``; the average is
        printed at the end.
    """
    import ntpath  # local import; splits on both '\\' and '/' regardless of host OS

    if prompts is None:
        prompts = complex_prompts
    prompts = list(prompts)
    if not prompts:
        # Nothing to average; bail out before the expensive model load
        # instead of failing later with ZeroDivisionError.
        print("No prompts supplied; nothing to benchmark.")
        return

    # Load the model
    model = load_model(model_path)

    # Measure time efficiency for each prompt
    inference_times = [infer(model, prompt) for prompt in prompts]

    # Calculate average inference time; the label comes from the file that
    # was actually loaded so it cannot drift from model_path.
    average_time = sum(inference_times) / len(inference_times)
    model_label = ntpath.basename(model_path)
    print(f"Average inference time for {model_label}: {average_time:.4f} seconds")

# Run the benchmark: loads the model, times each prompt, and prints the average.
main()


Loading model from C:\Users\Priyank\Downloads\nous-hermes-llama2-13b.Q4_0.gguf...
Model loaded.
Inference time for input 'Explain the purpose ...': 149.8371 seconds
Inference time for input 'Discuss the scope of...': 146.9645 seconds
Inference time for input 'Describe the princip...': 150.3610 seconds
Average inference time for nous-hermes-llama2-13b.Q4_0.gguf: 149.0542 seconds


# nous-hermes (with given PDF)

In [9]:
# Install necessary packages
!pip install gpt4all pdfminer.six Levenshtein

# Importing the libraries which are required
import time
import Levenshtein
from gpt4all import GPT4All
from pdfminer.high_level import extract_text

# Function to load the model
def load_model(model_path):
    """Create the GPT4All model stored at ``model_path``.

    A progress line is printed before construction and a confirmation
    line afterwards.

    Args:
        model_path: Model file location, passed straight to ``GPT4All``.

    Returns:
        The newly constructed ``GPT4All`` object.
    """
    print(f"Loading model from {model_path}...")
    loaded = GPT4All(model_path)
    print("Model loaded.")
    return loaded

# Function to perform inference and measure time
def infer(model, input_text):
    """Generate a response for ``input_text`` and time the call.

    Args:
        model: Object exposing ``generate(prompt)``.
        input_text: Prompt string handed to ``model.generate``.

    Returns:
        tuple: ``(response, inference_time)`` where ``response`` is whatever
        ``model.generate`` returned and ``inference_time`` is the duration
        of that call in seconds (float).
    """
    # perf_counter() is monotonic and high-resolution, so the measurement
    # cannot be skewed (or turn negative) by a system clock adjustment,
    # which is possible with time.time().
    start_time = time.perf_counter()
    response = model.generate(input_text)
    inference_time = time.perf_counter() - start_time
    # Only the first 20 characters of the prompt are echoed to keep the log short.
    print(f"Inference time for input '{input_text[:20]}...': {inference_time:.4f} seconds")
    return response, inference_time

# Function to extract text from a PDF file
def extract_text_from_pdf(pdf_path):
    """Return the text pdfminer's ``extract_text`` produces for ``pdf_path``.

    Args:
        pdf_path: Location of the PDF file, forwarded unchanged.

    Returns:
        The value returned by ``extract_text(pdf_path)``.
    """
    return extract_text(pdf_path)

# Main function to run
def main(model_path=r'C:\Users\Priyank\Downloads\nous-hermes-llama2-13b.Q4_0.gguf',
         pdf_path=r'C:\Users\Priyank\Downloads\test.pdf'):
    """Benchmark average generation latency for one model in the PDF scenario.

    Args:
        model_path: Path to the local model file. Defaults to the location
            that was previously hard-coded in this cell.
        pdf_path: Path to the PDF whose text is extracted. Defaults to the
            location that was previously hard-coded in this cell.

    Returns:
        None. Per-prompt timings are printed by ``infer``; the average is
        printed at the end.
    """
    import ntpath  # local import; splits on both '\\' and '/' regardless of host OS

    # Loading the model
    model = load_model(model_path)

    # Extract text from the PDF
    # NOTE(review): pdf_text is not referenced after this line, so the prompts
    # below are sent to the model WITHOUT any PDF content. If this run is meant
    # to measure latency with the document as context, the text still has to
    # be added to each prompt (mind the model's context length) - TODO confirm.
    pdf_text = extract_text_from_pdf(pdf_path)

    # Prompts which are based on the test PDF file
    complex_prompts = [
        "Explain the purpose of the Research Integrity Policy at Flinders University and how it aligns with the Australian Code for the Responsible Conduct of Research.",
        "Discuss the scope of the Research Integrity Policy at Flinders University, including who it applies to and the types of research activities it covers.",
        "Describe the principles and responsibilities outlined in the Research Integrity Policy for researchers at Flinders University. How do these principles ensure responsible research conduct?"
    ]

    # Measuring the time efficiency for each prompt; infer() returns
    # (response, seconds) and only the timing is needed here.
    inference_times = [infer(model, prompt)[1] for prompt in complex_prompts]

    # Calculating the average inference time; the label comes from the file
    # that was actually loaded so it cannot drift from model_path.
    average_time = sum(inference_times) / len(inference_times)
    model_label = ntpath.basename(model_path)
    print(f"Average inference time for {model_label}: {average_time:.4f} seconds")

# Run the benchmark: loads the model, extracts the PDF text, times each prompt,
# and prints the average.
main()



Model loaded.
Inference time for input 'Explain the purpose ...': 126.7757 seconds
Inference time for input 'Discuss the scope of...': 102.7743 seconds
Inference time for input 'Describe the princip...': 116.8028 seconds
Average inference time for Nous-Hermes-Llama2-13b.Q4_0.gguf: 115.4509 seconds


# gpt4all-13b-snoozy (with just prompts)

In [10]:
# Install necessary packages
!pip install gpt4all pdfminer.six

# Import required libraries
import time
from gpt4all import GPT4All
from pdfminer.high_level import extract_text

# Function to load the model
def load_model(model_path):
    """Load a GPT4All model and report progress on stdout.

    Args:
        model_path: Where the model file lives; given to ``GPT4All`` as is.

    Returns:
        The ``GPT4All`` instance created from ``model_path``.
    """
    print(f"Loading model from {model_path}...")
    instance = GPT4All(model_path)
    print("Model loaded.")
    return instance

# Function to perform inference and measure time
def infer(model, input_text):
    """Time a single ``model.generate`` call and return the elapsed seconds.

    Args:
        model: Object exposing ``generate(prompt)``.
        input_text: Prompt string handed to ``model.generate``.

    Returns:
        float: Duration of the ``generate`` call, in seconds.
    """
    # perf_counter() is monotonic and high-resolution, so the measurement
    # cannot be skewed (or turn negative) by a system clock adjustment,
    # which is possible with time.time().
    start_time = time.perf_counter()
    model.generate(input_text)  # generated text is discarded; only latency matters here
    inference_time = time.perf_counter() - start_time
    # Only the first 20 characters of the prompt are echoed to keep the log short.
    print(f"Inference time for input '{input_text[:20]}...': {inference_time:.4f} seconds")
    return inference_time

# Benchmark prompts about the Flinders University Research Integrity Policy
# (described by the author as based on the PDF content).
# main() reads this module-level list and times one generation per entry.
complex_prompts = [
    "Explain the purpose of the Research Integrity Policy at Flinders University and how it aligns with the Australian Code for the Responsible Conduct of Research.",
    "Discuss the scope of the Research Integrity Policy at Flinders University, including who it applies to and the types of research activities it covers.",
    "Describe the principles and responsibilities outlined in the Research Integrity Policy for researchers at Flinders University. How do these principles ensure responsible research conduct?"
    
]

# Main function to execute the benchmarking
def main(model_path=r'C:\Users\Priyank\Downloads\gpt4all-13b-snoozy-Q4_0.gguf', prompts=None):
    """Benchmark the average generation latency of one local model.

    Args:
        model_path: Path to the local model file. Defaults to the location
            that was previously hard-coded in this cell.
        prompts: Iterable of prompt strings to time. When ``None``, the
            module-level ``complex_prompts`` list is used.

    Returns:
        None. Per-prompt timings are printed by ``infer``; the average is
        printed at the end.
    """
    import ntpath  # local import; splits on both '\\' and '/' regardless of host OS

    if prompts is None:
        prompts = complex_prompts
    prompts = list(prompts)
    if not prompts:
        # Nothing to average; bail out before the expensive model load
        # instead of failing later with ZeroDivisionError.
        print("No prompts supplied; nothing to benchmark.")
        return

    # Load the model
    model = load_model(model_path)

    # Measure time efficiency for each prompt
    inference_times = [infer(model, prompt) for prompt in prompts]

    # Calculate average inference time; the label comes from the file that
    # was actually loaded so it cannot drift from model_path.
    average_time = sum(inference_times) / len(inference_times)
    model_label = ntpath.basename(model_path)
    print(f"Average inference time for {model_label}: {average_time:.4f} seconds")

# Run the benchmark: loads the model, times each prompt, and prints the average.
main()


Loading model from C:\Users\Priyank\Downloads\gpt4all-13b-snoozy-Q4_0.gguf...
Model loaded.
Inference time for input 'Explain the purpose ...': 137.7567 seconds
Inference time for input 'Discuss the scope of...': 118.2463 seconds
Inference time for input 'Describe the princip...': 118.9502 seconds
Average inference time for gpt4all-13b-snoozy-Q4_0.gguf: 124.9844 seconds


# gpt4all-13b-snoozy (with given PDF)

In [11]:
# Install necessary packages
!pip install gpt4all pdfminer.six Levenshtein

# Importing the libraries which are required
import time
import Levenshtein
from gpt4all import GPT4All
from pdfminer.high_level import extract_text

# Function to load the model
def load_model(model_path):
    """Create the GPT4All model stored at ``model_path``.

    A progress line is printed before construction and a confirmation
    line afterwards.

    Args:
        model_path: Model file location, passed straight to ``GPT4All``.

    Returns:
        The newly constructed ``GPT4All`` object.
    """
    print(f"Loading model from {model_path}...")
    loaded = GPT4All(model_path)
    print("Model loaded.")
    return loaded

# Function to perform inference and measure time
def infer(model, input_text):
    """Generate a response for ``input_text`` and time the call.

    Args:
        model: Object exposing ``generate(prompt)``.
        input_text: Prompt string handed to ``model.generate``.

    Returns:
        tuple: ``(response, inference_time)`` where ``response`` is whatever
        ``model.generate`` returned and ``inference_time`` is the duration
        of that call in seconds (float).
    """
    # perf_counter() is monotonic and high-resolution, so the measurement
    # cannot be skewed (or turn negative) by a system clock adjustment,
    # which is possible with time.time().
    start_time = time.perf_counter()
    response = model.generate(input_text)
    inference_time = time.perf_counter() - start_time
    # Only the first 20 characters of the prompt are echoed to keep the log short.
    print(f"Inference time for input '{input_text[:20]}...': {inference_time:.4f} seconds")
    return response, inference_time

# Function to extract text from a PDF file
def extract_text_from_pdf(pdf_path):
    """Run pdfminer's ``extract_text`` on ``pdf_path`` and hand back the result.

    Args:
        pdf_path: Location of the PDF file, forwarded unchanged.

    Returns:
        The value returned by ``extract_text(pdf_path)``.
    """
    return extract_text(pdf_path)

# Main function to run
def main(model_path=r'C:\Users\Priyank\Downloads\gpt4all-13b-snoozy-Q4_0.gguf',
         pdf_path=r'C:\Users\Priyank\Downloads\test.pdf'):
    """Benchmark average generation latency for one model in the PDF scenario.

    Args:
        model_path: Path to the local model file. Defaults to the location
            that was previously hard-coded in this cell.
        pdf_path: Path to the PDF whose text is extracted. Defaults to the
            location that was previously hard-coded in this cell.

    Returns:
        None. Per-prompt timings are printed by ``infer``; the average is
        printed at the end.
    """
    import ntpath  # local import; splits on both '\\' and '/' regardless of host OS

    # Loading the model
    model = load_model(model_path)

    # Extract text from the PDF
    # NOTE(review): pdf_text is not referenced after this line, so the prompts
    # below are sent to the model WITHOUT any PDF content. If this run is meant
    # to measure latency with the document as context, the text still has to
    # be added to each prompt (mind the model's context length) - TODO confirm.
    pdf_text = extract_text_from_pdf(pdf_path)

    # Prompts which are based on the test PDF file
    complex_prompts = [
        "Explain the purpose of the Research Integrity Policy at Flinders University and how it aligns with the Australian Code for the Responsible Conduct of Research.",
        "Discuss the scope of the Research Integrity Policy at Flinders University, including who it applies to and the types of research activities it covers.",
        "Describe the principles and responsibilities outlined in the Research Integrity Policy for researchers at Flinders University. How do these principles ensure responsible research conduct?"
    ]

    # Measuring the time efficiency for each prompt; infer() returns
    # (response, seconds) and only the timing is needed here.
    inference_times = [infer(model, prompt)[1] for prompt in complex_prompts]

    # Calculating the average inference time; the label comes from the file
    # that was actually loaded so it cannot drift from model_path.
    average_time = sum(inference_times) / len(inference_times)
    model_label = ntpath.basename(model_path)
    print(f"Average inference time for {model_label}: {average_time:.4f} seconds")

# Run the benchmark: loads the model, extracts the PDF text, times each prompt,
# and prints the average.
main()


Loading model from C:\Users\Priyank\Downloads\gpt4all-13b-snoozy-Q4_0.gguf...
Model loaded.
Inference time for input 'Explain the purpose ...': 120.5451 seconds
Inference time for input 'Discuss the scope of...': 117.9724 seconds
Inference time for input 'Describe the princip...': 120.2035 seconds
Average inference time for gpt4all-13b-snoozy-Q4_0.gguf: 119.5737 seconds


# mistral-7b-openorca (with just prompts)

In [12]:
# Install necessary packages
!pip install gpt4all pdfminer.six

# Import required libraries
import time
from gpt4all import GPT4All
from pdfminer.high_level import extract_text

# Function to load the model
def load_model(model_path):
    """Build a GPT4All model from ``model_path``, logging before and after.

    Args:
        model_path: Location of the model file; forwarded unchanged as the
            only argument to ``GPT4All``.

    Returns:
        The ``GPT4All`` instance that was constructed.
    """
    print(f"Loading model from {model_path}...")
    gpt_model = GPT4All(model_path)
    print("Model loaded.")
    return gpt_model

# Function to perform inference and measure time
def infer(model, input_text):
    """Time a single ``model.generate`` call and return the elapsed seconds.

    Args:
        model: Object exposing ``generate(prompt)``.
        input_text: Prompt string handed to ``model.generate``.

    Returns:
        float: Duration of the ``generate`` call, in seconds.
    """
    # perf_counter() is monotonic and high-resolution, so the measurement
    # cannot be skewed (or turn negative) by a system clock adjustment,
    # which is possible with time.time().
    start_time = time.perf_counter()
    model.generate(input_text)  # generated text is discarded; only latency matters here
    inference_time = time.perf_counter() - start_time
    # Only the first 20 characters of the prompt are echoed to keep the log short.
    print(f"Inference time for input '{input_text[:20]}...': {inference_time:.4f} seconds")
    return inference_time

# Benchmark prompts about the Flinders University Research Integrity Policy
# (described by the author as based on the PDF content).
# main() reads this module-level list and times one generation per entry.
complex_prompts = [
    "Explain the purpose of the Research Integrity Policy at Flinders University and how it aligns with the Australian Code for the Responsible Conduct of Research.",
    "Discuss the scope of the Research Integrity Policy at Flinders University, including who it applies to and the types of research activities it covers.",
    "Describe the principles and responsibilities outlined in the Research Integrity Policy for researchers at Flinders University. How do these principles ensure responsible research conduct?"
    
]

# Main function to execute the benchmarking
def main(model_path=r'C:\Users\Priyank\Downloads\mistral-7b-openorca.gguf2.Q4_0.gguf', prompts=None):
    """Benchmark the average generation latency of one local model.

    Args:
        model_path: Path to the local model file. Defaults to the location
            that was previously hard-coded in this cell.
        prompts: Iterable of prompt strings to time. When ``None``, the
            module-level ``complex_prompts`` list is used.

    Returns:
        None. Per-prompt timings are printed by ``infer``; the average is
        printed at the end.
    """
    import ntpath  # local import; splits on both '\\' and '/' regardless of host OS

    if prompts is None:
        prompts = complex_prompts
    prompts = list(prompts)
    if not prompts:
        # Nothing to average; bail out before the expensive model load
        # instead of failing later with ZeroDivisionError.
        print("No prompts supplied; nothing to benchmark.")
        return

    # Load the model
    model = load_model(model_path)

    # Measure time efficiency for each prompt
    inference_times = [infer(model, prompt) for prompt in prompts]

    # Calculate average inference time; the label comes from the file that
    # was actually loaded so it cannot drift from model_path.
    average_time = sum(inference_times) / len(inference_times)
    model_label = ntpath.basename(model_path)
    print(f"Average inference time for {model_label}: {average_time:.4f} seconds")

# Run the benchmark: loads the model, times each prompt, and prints the average.
main()


Loading model from C:\Users\Priyank\Downloads\mistral-7b-openorca.gguf2.Q4_0.gguf...
Model loaded.
Inference time for input 'Explain the purpose ...': 20.3384 seconds
Inference time for input 'Discuss the scope of...': 8.3902 seconds
Inference time for input 'Describe the princip...': 8.6588 seconds
Average inference time for mistral-7b-openorca.gguf2.Q4_0.gguf: 12.4625 seconds


# mistral-7b-openorca (with given PDF)

In [13]:
# Install necessary packages
!pip install gpt4all pdfminer.six Levenshtein

# Importing the libraries which are required
import time
import Levenshtein
from gpt4all import GPT4All
from pdfminer.high_level import extract_text

# Function to load the model
def load_model(model_path):
    """Load a GPT4All model and report progress on stdout.

    Args:
        model_path: Where the model file lives; given to ``GPT4All`` as is.

    Returns:
        The ``GPT4All`` instance created from ``model_path``.
    """
    print(f"Loading model from {model_path}...")
    instance = GPT4All(model_path)
    print("Model loaded.")
    return instance

# Function to perform inference and measure time
def infer(model, input_text):
    """Generate a response for ``input_text`` and time the call.

    Args:
        model: Object exposing ``generate(prompt)``.
        input_text: Prompt string handed to ``model.generate``.

    Returns:
        tuple: ``(response, inference_time)`` where ``response`` is whatever
        ``model.generate`` returned and ``inference_time`` is the duration
        of that call in seconds (float).
    """
    # perf_counter() is monotonic and high-resolution, so the measurement
    # cannot be skewed (or turn negative) by a system clock adjustment,
    # which is possible with time.time().
    start_time = time.perf_counter()
    response = model.generate(input_text)
    inference_time = time.perf_counter() - start_time
    # Only the first 20 characters of the prompt are echoed to keep the log short.
    print(f"Inference time for input '{input_text[:20]}...': {inference_time:.4f} seconds")
    return response, inference_time

# Function to extract text from a PDF file
def extract_text_from_pdf(pdf_path):
    """Return the text pdfminer's ``extract_text`` produces for ``pdf_path``.

    Args:
        pdf_path: Location of the PDF file, forwarded unchanged.

    Returns:
        The value returned by ``extract_text(pdf_path)``.
    """
    return extract_text(pdf_path)

# Main function to run
def main(model_path=r'C:\Users\Priyank\Downloads\mistral-7b-openorca.gguf2.Q4_0.gguf',
         pdf_path=r'C:\Users\Priyank\Downloads\test.pdf'):
    """Benchmark average generation latency for one model in the PDF scenario.

    Args:
        model_path: Path to the local model file. Defaults to the location
            that was previously hard-coded in this cell.
        pdf_path: Path to the PDF whose text is extracted. Defaults to the
            location that was previously hard-coded in this cell.

    Returns:
        None. Per-prompt timings are printed by ``infer``; the average is
        printed at the end.
    """
    import ntpath  # local import; splits on both '\\' and '/' regardless of host OS

    # Loading the model
    model = load_model(model_path)

    # Extract text from the PDF
    # NOTE(review): pdf_text is not referenced after this line, so the prompts
    # below are sent to the model WITHOUT any PDF content. If this run is meant
    # to measure latency with the document as context, the text still has to
    # be added to each prompt (mind the model's context length) - TODO confirm.
    pdf_text = extract_text_from_pdf(pdf_path)

    # Prompts which are based on the test PDF file
    complex_prompts = [
        "Explain the purpose of the Research Integrity Policy at Flinders University and how it aligns with the Australian Code for the Responsible Conduct of Research.",
        "Discuss the scope of the Research Integrity Policy at Flinders University, including who it applies to and the types of research activities it covers.",
        "Describe the principles and responsibilities outlined in the Research Integrity Policy for researchers at Flinders University. How do these principles ensure responsible research conduct?"
    ]

    # Measuring the time efficiency for each prompt; infer() returns
    # (response, seconds) and only the timing is needed here.
    inference_times = [infer(model, prompt)[1] for prompt in complex_prompts]

    # Calculating the average inference time; the label comes from the file
    # that was actually loaded so it cannot drift from model_path.
    average_time = sum(inference_times) / len(inference_times)
    model_label = ntpath.basename(model_path)
    print(f"Average inference time for {model_label}: {average_time:.4f} seconds")

# Run the benchmark: loads the model, extracts the PDF text, times each prompt,
# and prints the average.
main()



Model loaded.
Inference time for input 'Explain the purpose ...': 10.1479 seconds
Inference time for input 'Discuss the scope of...': 8.5242 seconds
Inference time for input 'Describe the princip...': 8.6150 seconds
Average inference time for mistral-7b-openorca.gguf2.Q4_0.gguf: 9.0957 seconds


# gpt4all-falcon-newbpe (with just prompts)

In [14]:
# Install necessary packages
!pip install gpt4all pdfminer.six

# Import required libraries
import time
from gpt4all import GPT4All
from pdfminer.high_level import extract_text

# Function to load the model
def load_model(model_path):
    """Create the GPT4All model stored at ``model_path``.

    A progress line is printed before construction and a confirmation
    line afterwards.

    Args:
        model_path: Model file location, passed straight to ``GPT4All``.

    Returns:
        The newly constructed ``GPT4All`` object.
    """
    print(f"Loading model from {model_path}...")
    loaded = GPT4All(model_path)
    print("Model loaded.")
    return loaded

# Function to perform inference and measure time
def infer(model, input_text):
    """Time a single ``model.generate`` call and return the elapsed seconds.

    Args:
        model: Object exposing ``generate(prompt)``.
        input_text: Prompt string handed to ``model.generate``.

    Returns:
        float: Duration of the ``generate`` call, in seconds.
    """
    # perf_counter() is monotonic and high-resolution, so the measurement
    # cannot be skewed (or turn negative) by a system clock adjustment,
    # which is possible with time.time().
    start_time = time.perf_counter()
    model.generate(input_text)  # generated text is discarded; only latency matters here
    inference_time = time.perf_counter() - start_time
    # Only the first 20 characters of the prompt are echoed to keep the log short.
    print(f"Inference time for input '{input_text[:20]}...': {inference_time:.4f} seconds")
    return inference_time

# Benchmark prompts about the Flinders University Research Integrity Policy
# (described by the author as based on the PDF content).
# main() reads this module-level list and times one generation per entry.
complex_prompts = [
    "Explain the purpose of the Research Integrity Policy at Flinders University and how it aligns with the Australian Code for the Responsible Conduct of Research.",
    "Discuss the scope of the Research Integrity Policy at Flinders University, including who it applies to and the types of research activities it covers.",
    "Describe the principles and responsibilities outlined in the Research Integrity Policy for researchers at Flinders University. How do these principles ensure responsible research conduct?"
    
]

# Main function to execute the benchmarking
def main(model_path=r'C:\Users\Priyank\Downloads\gpt4all-falcon-newbpe-q4_0.gguf', prompts=None):
    """Benchmark the average generation latency of one local model.

    Args:
        model_path: Path to the local model file. Defaults to the location
            that was previously hard-coded in this cell.
        prompts: Iterable of prompt strings to time. When ``None``, the
            module-level ``complex_prompts`` list is used.

    Returns:
        None. Per-prompt timings are printed by ``infer``; the average is
        printed at the end.
    """
    import ntpath  # local import; splits on both '\\' and '/' regardless of host OS

    if prompts is None:
        prompts = complex_prompts
    prompts = list(prompts)
    if not prompts:
        # Nothing to average; bail out before the expensive model load
        # instead of failing later with ZeroDivisionError.
        print("No prompts supplied; nothing to benchmark.")
        return

    # Load the model
    model = load_model(model_path)

    # Measure time efficiency for each prompt
    inference_times = [infer(model, prompt) for prompt in prompts]

    # Calculate average inference time; the label comes from the file that
    # was actually loaded so it cannot drift from model_path.
    average_time = sum(inference_times) / len(inference_times)
    model_label = ntpath.basename(model_path)
    print(f"Average inference time for {model_label}: {average_time:.4f} seconds")

# Run the benchmark: loads the model, times each prompt, and prints the average.
main()


Loading model from C:\Users\Priyank\Downloads\gpt4all-falcon-newbpe-q4_0.gguf...
Model loaded.
Inference time for input 'Explain the purpose ...': 72.5124 seconds
Inference time for input 'Discuss the scope of...': 63.5614 seconds
Inference time for input 'Describe the princip...': 62.5283 seconds
Average inference time for gpt4all-falcon-newbpe-q4_0.gguf: 66.2007 seconds


# gpt4all-falcon-newbpe (with given PDF)

In [15]:
# Install necessary packages
!pip install gpt4all pdfminer.six Levenshtein

# Importing the libraries which are required
import time
import Levenshtein
from gpt4all import GPT4All
from pdfminer.high_level import extract_text

# Function to load the model
def load_model(model_path):
    """Build a GPT4All model from ``model_path``, logging before and after.

    Args:
        model_path: Location of the model file; forwarded unchanged as the
            only argument to ``GPT4All``.

    Returns:
        The ``GPT4All`` instance that was constructed.
    """
    print(f"Loading model from {model_path}...")
    gpt_model = GPT4All(model_path)
    print("Model loaded.")
    return gpt_model

# Function to perform inference and measure time
def infer(model, input_text):
    """Generate a response for ``input_text`` and time the call.

    Args:
        model: Object exposing ``generate(prompt)``.
        input_text: Prompt string handed to ``model.generate``.

    Returns:
        tuple: ``(response, inference_time)`` where ``response`` is whatever
        ``model.generate`` returned and ``inference_time`` is the duration
        of that call in seconds (float).
    """
    # perf_counter() is monotonic and high-resolution, so the measurement
    # cannot be skewed (or turn negative) by a system clock adjustment,
    # which is possible with time.time().
    start_time = time.perf_counter()
    response = model.generate(input_text)
    inference_time = time.perf_counter() - start_time
    # Only the first 20 characters of the prompt are echoed to keep the log short.
    print(f"Inference time for input '{input_text[:20]}...': {inference_time:.4f} seconds")
    return response, inference_time

# Function to extract text from a PDF file
def extract_text_from_pdf(pdf_path):
    """Run pdfminer's ``extract_text`` on ``pdf_path`` and hand back the result.

    Args:
        pdf_path: Location of the PDF file, forwarded unchanged.

    Returns:
        The value returned by ``extract_text(pdf_path)``.
    """
    return extract_text(pdf_path)

# Main function to run
def main(model_path=r'C:\Users\Priyank\Downloads\gpt4all-falcon-newbpe-q4_0.gguf',
         pdf_path=r'C:\Users\Priyank\Downloads\test.pdf'):
    """Benchmark average generation latency for one model in the PDF scenario.

    Args:
        model_path: Path to the local model file. Defaults to the location
            that was previously hard-coded in this cell.
        pdf_path: Path to the PDF whose text is extracted. Defaults to the
            location that was previously hard-coded in this cell.

    Returns:
        None. Per-prompt timings are printed by ``infer``; the average is
        printed at the end.
    """
    import ntpath  # local import; splits on both '\\' and '/' regardless of host OS

    # Loading the model
    model = load_model(model_path)

    # Extract text from the PDF
    # NOTE(review): pdf_text is not referenced after this line, so the prompts
    # below are sent to the model WITHOUT any PDF content. If this run is meant
    # to measure latency with the document as context, the text still has to
    # be added to each prompt (mind the model's context length) - TODO confirm.
    pdf_text = extract_text_from_pdf(pdf_path)

    # Prompts which are based on the test PDF file
    complex_prompts = [
        "Explain the purpose of the Research Integrity Policy at Flinders University and how it aligns with the Australian Code for the Responsible Conduct of Research.",
        "Discuss the scope of the Research Integrity Policy at Flinders University, including who it applies to and the types of research activities it covers.",
        "Describe the principles and responsibilities outlined in the Research Integrity Policy for researchers at Flinders University. How do these principles ensure responsible research conduct?"
    ]

    # Measuring the time efficiency for each prompt; infer() returns
    # (response, seconds) and only the timing is needed here.
    inference_times = [infer(model, prompt)[1] for prompt in complex_prompts]

    # Calculating the average inference time; the label comes from the file
    # that was actually loaded so it cannot drift from model_path.
    average_time = sum(inference_times) / len(inference_times)
    model_label = ntpath.basename(model_path)
    print(f"Average inference time for {model_label}: {average_time:.4f} seconds")

# Run the benchmark: loads the model, extracts the PDF text, times each prompt,
# and prints the average.
main()


Loading model from C:\Users\Priyank\Downloads\gpt4all-falcon-newbpe-q4_0.gguf...
Model loaded.
Inference time for input 'Explain the purpose ...': 62.8141 seconds
Inference time for input 'Discuss the scope of...': 62.3117 seconds
Inference time for input 'Describe the princip...': 62.9707 seconds
Average inference time for gpt4all-falcon-newbpe-q4_0.gguf: 62.6988 seconds
