# nous-hermes-llama2-13b (with given PDF)

In [1]:
pip install gpt4all pdfminer.six psutil


Note: you may need to restart the kernel to use updated packages.


In [2]:
# Install necessary packages
!pip install gpt4all pdfminer.six psutil

# Import required libraries
import psutil
from gpt4all import GPT4All
from pdfminer.high_level import extract_text

# Function to load the model
def load_model(model_path):
    print(f"Loading model from {model_path}...")
    model = GPT4All(model_path)
    print("Model loaded.")
    return model

# Function to perform inference and measure memory consumption
def infer_memory_usage(model, input_text):
    process = psutil.Process()
    mem_before = process.memory_info().rss / (1024 ** 2)  # Memory usage in MB before inference
    response = model.generate(input_text)
    mem_after = process.memory_info().rss / (1024 ** 2)  # Memory usage in MB after inference
    memory_usage = mem_after - mem_before
    print(f"Memory usage for input '{input_text[:20]}...': {memory_usage:.4f} MB")
    return memory_usage

# Function to extract text from a PDF file
def extract_text_from_pdf(pdf_path):
    text = extract_text(pdf_path)
    return text.split('\n')

# Complex prompts based on the PDF content
complex_prompts = [
    "Explain the purpose of the Research Integrity Policy at Flinders University and how it aligns with the Australian Code for the Responsible Conduct of Research.",
    "Discuss the scope of the Research Integrity Policy at Flinders University, including who it applies to and the types of research activities it covers.",
    "Describe the principles and responsibilities outlined in the Research Integrity Policy for researchers at Flinders University. How do these principles ensure responsible research conduct?"
   
]

# Main function to execute the benchmarking
def main():
    # Path to the PDF dataset file
    pdf_path = r'C:\Users\Priyank\Downloads\test.pdf'
    
    # Extract the dataset
    test_inputs = extract_text_from_pdf(pdf_path)
    
    # Filter out short or irrelevant lines
    test_inputs = [line for line in test_inputs if len(line) > 10]
    
    # Path to the local model file
    model_path = r'C:\Users\Priyank\Downloads\nous-hermes-llama2-13b.Q4_0.gguf'  # Ensure this path is correct
    
    # Load the model
    model = load_model(model_path)
    
    # Measure memory consumption for each complex prompt
    memory_usages = [infer_memory_usage(model, prompt) for prompt in complex_prompts]
    
    # Calculate average memory usage
    average_memory_usage = sum(memory_usages) / len(memory_usages)
    print(f"Average memory usage for Nous-Hermes-Llama2-13b.Q4_0.gguf: {average_memory_usage:.4f} MB")

# Execute the main function
main()


Loading model from C:\Users\Priyank\Downloads\nous-hermes-llama2-13b.Q4_0.gguf...
Model loaded.
Memory usage for input 'Explain the purpose ...': 6944.6953 MB
Memory usage for input 'Discuss the scope of...': 0.3477 MB
Memory usage for input 'Describe the princip...': -708.5625 MB
Average memory usage for Nous-Hermes-Llama2-13b.Q4_0.gguf: 2078.8268 MB


# nous-hermes-llama2-13b (with just prompts)

In [3]:
# Install necessary packages
!pip install gpt4all psutil

# Import required libraries
import psutil
from gpt4all import GPT4All

# Function to load the model
def load_model(model_path):
    print(f"Loading model from {model_path}...")
    model = GPT4All(model_path)
    print("Model loaded.")
    return model

# Function to perform inference and measure memory consumption
def infer_memory_usage(model, input_text):
    process = psutil.Process()
    mem_before = process.memory_info().rss / (1024 ** 2)  # Memory usage in MB before inference
    response = model.generate(input_text)
    mem_after = process.memory_info().rss / (1024 ** 2)  # Memory usage in MB after inference
    memory_usage = mem_after - mem_before
    print(f"Memory usage for input '{input_text[:20]}...': {memory_usage:.4f} MB")
    return memory_usage

# Complex prompts
complex_prompts = [
    "Explain the purpose of the Research Integrity Policy at Flinders University and how it aligns with the Australian Code for the Responsible Conduct of Research.",
    "Discuss the scope of the Research Integrity Policy at Flinders University, including who it applies to and the types of research activities it covers.",
    "Describe the principles and responsibilities outlined in the Research Integrity Policy for researchers at Flinders University. How do these principles ensure responsible research conduct?"
]

# Main function to execute the benchmarking
def main():
    # Path to the local model file
    model_path = r'C:\Users\Priyank\Downloads\nous-hermes-llama2-13b.Q4_0.gguf'  # Ensure this path is correct
    
    # Load the model
    model = load_model(model_path)
    
    # Measure memory consumption for each complex prompt
    memory_usages = [infer_memory_usage(model, prompt) for prompt in complex_prompts]
    
    # Calculate average memory usage
    average_memory_usage = sum(memory_usages) / len(memory_usages)
    print(f"Average memory usage for Nous-Hermes-Llama2-13b.Q4_0.gguf: {average_memory_usage:.4f} MB")

# Execute the main function
main()


Loading model from C:\Users\Priyank\Downloads\nous-hermes-llama2-13b.Q4_0.gguf...
Model loaded.
Memory usage for input 'Explain the purpose ...': 6906.4961 MB
Memory usage for input 'Discuss the scope of...': 0.2852 MB
Memory usage for input 'Describe the princip...': 0.4609 MB
Average memory usage for Nous-Hermes-Llama2-13b.Q4_0.gguf: 2302.4141 MB


# gpt4all-13b-snoozy-Q4_0 (with just PDF)

In [4]:
# Install necessary packages
!pip install gpt4all pdfminer.six psutil

# Import required libraries
import psutil
from gpt4all import GPT4All
from pdfminer.high_level import extract_text

# Function to load the model
def load_model(model_path):
    print(f"Loading model from {model_path}...")
    model = GPT4All(model_path)
    print("Model loaded.")
    return model

# Function to perform inference and measure memory consumption
def infer_memory_usage(model, input_text):
    process = psutil.Process()
    mem_before = process.memory_info().rss / (1024 ** 2)  # Memory usage in MB before inference
    response = model.generate(input_text)
    mem_after = process.memory_info().rss / (1024 ** 2)  # Memory usage in MB after inference
    memory_usage = mem_after - mem_before
    print(f"Memory usage for input '{input_text[:20]}...': {memory_usage:.4f} MB")
    return memory_usage

# Function to extract text from a PDF file
def extract_text_from_pdf(pdf_path):
    text = extract_text(pdf_path)
    return text.split('\n')

# Complex prompts based on the PDF content
complex_prompts = [
    "Explain the purpose of the Research Integrity Policy at Flinders University and how it aligns with the Australian Code for the Responsible Conduct of Research.",
    "Discuss the scope of the Research Integrity Policy at Flinders University, including who it applies to and the types of research activities it covers.",
    "Describe the principles and responsibilities outlined in the Research Integrity Policy for researchers at Flinders University. How do these principles ensure responsible research conduct?"
   
]

# Main function to execute the benchmarking
def main():
    # Path to the PDF dataset file
    pdf_path = r'C:\Users\Priyank\Downloads\test.pdf'
    
    # Extract the dataset
    test_inputs = extract_text_from_pdf(pdf_path)
    
    # Filter out short or irrelevant lines
    test_inputs = [line for line in test_inputs if len(line) > 10]
    
    # Path to the local model file
    model_path = r'C:\Users\Priyank\Downloads\gpt4all-13b-snoozy-Q4_0.gguf'  # Ensure this path is correct
    
    # Load the model
    model = load_model(model_path)
    
    # Measure memory consumption for each complex prompt
    memory_usages = [infer_memory_usage(model, prompt) for prompt in complex_prompts]
    
    # Calculate average memory usage
    average_memory_usage = sum(memory_usages) / len(memory_usages)
    print(f"Average memory usage for gpt4all-13b-snoozy-Q4_0.gguf: {average_memory_usage:.4f} MB")

# Execute the main function
main()


Loading model from C:\Users\Priyank\Downloads\gpt4all-13b-snoozy-Q4_0.gguf...
Model loaded.
Memory usage for input 'Explain the purpose ...': 6918.0742 MB
Memory usage for input 'Discuss the scope of...': 0.5234 MB
Memory usage for input 'Describe the princip...': 0.4570 MB
Average memory usage for gpt4all-13b-snoozy-Q4_0.gguf: 2306.3516 MB


# gpt4all-13b-snoozy-Q4_0 (with just prompts)

In [5]:
# Install necessary packages
!pip install gpt4all psutil

# Import required libraries
import psutil
from gpt4all import GPT4All

# Function to load the model
def load_model(model_path):
    print(f"Loading model from {model_path}...")
    model = GPT4All(model_path)
    print("Model loaded.")
    return model

# Function to perform inference and measure memory consumption
def infer_memory_usage(model, input_text):
    process = psutil.Process()
    mem_before = process.memory_info().rss / (1024 ** 2)  # Memory usage in MB before inference
    response = model.generate(input_text)
    mem_after = process.memory_info().rss / (1024 ** 2)  # Memory usage in MB after inference
    memory_usage = mem_after - mem_before
    print(f"Memory usage for input '{input_text[:20]}...': {memory_usage:.4f} MB")
    return memory_usage

# Complex prompts
complex_prompts = [
    "Explain the purpose of the Research Integrity Policy at Flinders University and how it aligns with the Australian Code for the Responsible Conduct of Research.",
    "Discuss the scope of the Research Integrity Policy at Flinders University, including who it applies to and the types of research activities it covers.",
    "Describe the principles and responsibilities outlined in the Research Integrity Policy for researchers at Flinders University. How do these principles ensure responsible research conduct?"
]

# Main function to execute the benchmarking
def main():
    # Path to the local model file
    model_path = r'C:\Users\Priyank\Downloads\gpt4all-13b-snoozy-Q4_0.gguf'  # Ensure this path is correct
    
    # Load the model
    model = load_model(model_path)
    
    # Measure memory consumption for each complex prompt
    memory_usages = [infer_memory_usage(model, prompt) for prompt in complex_prompts]
    
    # Calculate average memory usage
    average_memory_usage = sum(memory_usages) / len(memory_usages)
    print(f"Average memory usage for gpt4all-13b-snoozy-Q4_0.gguf: {average_memory_usage:.4f} MB")

# Execute the main function
main()


Loading model from C:\Users\Priyank\Downloads\gpt4all-13b-snoozy-Q4_0.gguf...
Model loaded.
Memory usage for input 'Explain the purpose ...': 6940.6094 MB
Memory usage for input 'Discuss the scope of...': -5.7344 MB
Memory usage for input 'Describe the princip...': -702.3750 MB
Average memory usage for gpt4all-13b-snoozy-Q4_0.gguf: 2077.5000 MB


# mistral-7b-openorca (with given PDF)

In [6]:
# Install necessary packages
!pip install gpt4all pdfminer.six psutil

# Import required libraries
import psutil
from gpt4all import GPT4All
from pdfminer.high_level import extract_text

# Function to load the model
def load_model(model_path):
    print(f"Loading model from {model_path}...")
    model = GPT4All(model_path)
    print("Model loaded.")
    return model

# Function to perform inference and measure memory consumption
def infer_memory_usage(model, input_text):
    process = psutil.Process()
    mem_before = process.memory_info().rss / (1024 ** 2)  # Memory usage in MB before inference
    response = model.generate(input_text)
    mem_after = process.memory_info().rss / (1024 ** 2)  # Memory usage in MB after inference
    memory_usage = mem_after - mem_before
    print(f"Memory usage for input '{input_text[:20]}...': {memory_usage:.4f} MB")
    return memory_usage

# Function to extract text from a PDF file
def extract_text_from_pdf(pdf_path):
    text = extract_text(pdf_path)
    return text.split('\n')

# Complex prompts based on the PDF content
complex_prompts = [
    "Explain the purpose of the Research Integrity Policy at Flinders University and how it aligns with the Australian Code for the Responsible Conduct of Research.",
    "Discuss the scope of the Research Integrity Policy at Flinders University, including who it applies to and the types of research activities it covers.",
    "Describe the principles and responsibilities outlined in the Research Integrity Policy for researchers at Flinders University. How do these principles ensure responsible research conduct?"
   
]

# Main function to execute the benchmarking
def main():
    # Path to the PDF dataset file
    pdf_path = r'C:\Users\Priyank\Downloads\test.pdf'
    
    # Extract the dataset
    test_inputs = extract_text_from_pdf(pdf_path)
    
    # Filter out short or irrelevant lines
    test_inputs = [line for line in test_inputs if len(line) > 10]
    
    # Path to the local model file
    model_path = r'C:\Users\Priyank\Downloads\mistral-7b-openorca.gguf2.Q4_0.gguf'  # Ensure this path is correct
    
    # Load the model
    model = load_model(model_path)
    
    # Measure memory consumption for each complex prompt
    memory_usages = [infer_memory_usage(model, prompt) for prompt in complex_prompts]
    
    # Calculate average memory usage
    average_memory_usage = sum(memory_usages) / len(memory_usages)
    print(f"Average memory usage for mistral-7b-openorca.gguf2.Q4_0.gguf: {average_memory_usage:.4f} MB")

# Execute the main function
main()


Loading model from C:\Users\Priyank\Downloads\mistral-7b-openorca.gguf2.Q4_0.gguf...
Model loaded.
Memory usage for input 'Explain the purpose ...': 3851.3047 MB
Memory usage for input 'Discuss the scope of...': 0.0742 MB
Memory usage for input 'Describe the princip...': 0.0938 MB
Average memory usage for mistral-7b-openorca.gguf2.Q4_0.gguf: 1283.8242 MB


# mistral-7b-openorca (with just prompts)

In [7]:
# Install necessary packages
!pip install gpt4all psutil

# Import required libraries
import psutil
from gpt4all import GPT4All

# Function to load the model
def load_model(model_path):
    print(f"Loading model from {model_path}...")
    model = GPT4All(model_path)
    print("Model loaded.")
    return model

# Function to perform inference and measure memory consumption
def infer_memory_usage(model, input_text):
    process = psutil.Process()
    mem_before = process.memory_info().rss / (1024 ** 2)  # Memory usage in MB before inference
    response = model.generate(input_text)
    mem_after = process.memory_info().rss / (1024 ** 2)  # Memory usage in MB after inference
    memory_usage = mem_after - mem_before
    print(f"Memory usage for input '{input_text[:20]}...': {memory_usage:.4f} MB")
    return memory_usage

# Complex prompts
complex_prompts = [
    "Explain the purpose of the Research Integrity Policy at Flinders University and how it aligns with the Australian Code for the Responsible Conduct of Research.",
    "Discuss the scope of the Research Integrity Policy at Flinders University, including who it applies to and the types of research activities it covers.",
    "Describe the principles and responsibilities outlined in the Research Integrity Policy for researchers at Flinders University. How do these principles ensure responsible research conduct?"
]

# Main function to execute the benchmarking
def main():
    # Path to the local model file
    model_path = r'C:\Users\Priyank\Downloads\mistral-7b-openorca.gguf2.Q4_0.gguf'  # Ensure this path is correct
    
    # Load the model
    model = load_model(model_path)
    
    # Measure memory consumption for each complex prompt
    memory_usages = [infer_memory_usage(model, prompt) for prompt in complex_prompts]
    
    # Calculate average memory usage
    average_memory_usage = sum(memory_usages) / len(memory_usages)
    print(f"Average memory usage for mistral-7b-openorca.gguf2.Q4_0.gguf: {average_memory_usage:.4f} MB")

# Execute the main function
main()


Loading model from C:\Users\Priyank\Downloads\mistral-7b-openorca.gguf2.Q4_0.gguf...
Model loaded.
Memory usage for input 'Explain the purpose ...': 3851.3359 MB
Memory usage for input 'Discuss the scope of...': 0.0742 MB
Memory usage for input 'Describe the princip...': 0.0977 MB
Average memory usage for mistral-7b-openorca.gguf2.Q4_0.gguf: 1283.8359 MB


# gpt4all-falcon-newbpe (with given PDF)

In [8]:
# Install necessary packages
!pip install gpt4all pdfminer.six psutil

# Import required libraries
import psutil
from gpt4all import GPT4All
from pdfminer.high_level import extract_text

# Function to load the model
def load_model(model_path):
    print(f"Loading model from {model_path}...")
    model = GPT4All(model_path)
    print("Model loaded.")
    return model

# Function to perform inference and measure memory consumption
def infer_memory_usage(model, input_text):
    process = psutil.Process()
    mem_before = process.memory_info().rss / (1024 ** 2)  # Memory usage in MB before inference
    response = model.generate(input_text)
    mem_after = process.memory_info().rss / (1024 ** 2)  # Memory usage in MB after inference
    memory_usage = mem_after - mem_before
    print(f"Memory usage for input '{input_text[:20]}...': {memory_usage:.4f} MB")
    return memory_usage

# Function to extract text from a PDF file
def extract_text_from_pdf(pdf_path):
    text = extract_text(pdf_path)
    return text.split('\n')

# Complex prompts based on the PDF content
complex_prompts = [
    "Explain the purpose of the Research Integrity Policy at Flinders University and how it aligns with the Australian Code for the Responsible Conduct of Research.",
    "Discuss the scope of the Research Integrity Policy at Flinders University, including who it applies to and the types of research activities it covers.",
    "Describe the principles and responsibilities outlined in the Research Integrity Policy for researchers at Flinders University. How do these principles ensure responsible research conduct?"
   
]

# Main function to execute the benchmarking
def main():
    # Path to the PDF dataset file
    pdf_path = r'C:\Users\Priyank\Downloads\test.pdf'
    
    # Extract the dataset
    test_inputs = extract_text_from_pdf(pdf_path)
    
    # Filter out short or irrelevant lines
    test_inputs = [line for line in test_inputs if len(line) > 10]
    
    # Path to the local model file
    model_path = r'C:\Users\Priyank\Downloads\gpt4all-falcon-newbpe-q4_0.gguf'  # Ensure this path is correct
    
    # Load the model
    model = load_model(model_path)
    
    # Measure memory consumption for each complex prompt
    memory_usages = [infer_memory_usage(model, prompt) for prompt in complex_prompts]
    
    # Calculate average memory usage
    average_memory_usage = sum(memory_usages) / len(memory_usages)
    print(f"Average memory usage for gpt4all-falcon-newbpe-q4_0.gguf: {average_memory_usage:.4f} MB")

# Execute the main function
main()


Loading model from C:\Users\Priyank\Downloads\gpt4all-falcon-newbpe-q4_0.gguf...
Model loaded.
Memory usage for input 'Explain the purpose ...': 3840.9062 MB
Memory usage for input 'Discuss the scope of...': 0.5039 MB
Memory usage for input 'Describe the princip...': 0.3711 MB
Average memory usage for gpt4all-falcon-newbpe-q4_0.gguf: 1280.5938 MB


# gpt4all-falcon-newbpe (with just prompts)

In [9]:
# Install necessary packages
!pip install gpt4all psutil

# Import required libraries
import psutil
from gpt4all import GPT4All

# Function to load the model
def load_model(model_path):
    print(f"Loading model from {model_path}...")
    model = GPT4All(model_path)
    print("Model loaded.")
    return model

# Function to perform inference and measure memory consumption
def infer_memory_usage(model, input_text):
    process = psutil.Process()
    mem_before = process.memory_info().rss / (1024 ** 2)  # Memory usage in MB before inference
    response = model.generate(input_text)
    mem_after = process.memory_info().rss / (1024 ** 2)  # Memory usage in MB after inference
    memory_usage = mem_after - mem_before
    print(f"Memory usage for input '{input_text[:20]}...': {memory_usage:.4f} MB")
    return memory_usage

# Complex prompts
complex_prompts = [
    "Explain the purpose of the Research Integrity Policy at Flinders University and how it aligns with the Australian Code for the Responsible Conduct of Research.",
    "Discuss the scope of the Research Integrity Policy at Flinders University, including who it applies to and the types of research activities it covers.",
    "Describe the principles and responsibilities outlined in the Research Integrity Policy for researchers at Flinders University. How do these principles ensure responsible research conduct?"
]

# Main function to execute the benchmarking
def main():
    # Path to the local model file
    model_path = r'C:\Users\Priyank\Downloads\gpt4all-falcon-newbpe-q4_0.gguf'  # Ensure this path is correct
    
    # Load the model
    model = load_model(model_path)
    
    # Measure memory consumption for each complex prompt
    memory_usages = [infer_memory_usage(model, prompt) for prompt in complex_prompts]
    
    # Calculate average memory usage
    average_memory_usage = sum(memory_usages) / len(memory_usages)
    print(f"Average memory usage for gpt4all-falcon-newbpe-q4_0.gguf: {average_memory_usage:.4f} MB")

# Execute the main function
main()


Loading model from C:\Users\Priyank\Downloads\gpt4all-falcon-newbpe-q4_0.gguf...
Model loaded.
Memory usage for input 'Explain the purpose ...': 3860.7031 MB
Memory usage for input 'Discuss the scope of...': 0.3711 MB
Memory usage for input 'Describe the princip...': 0.1953 MB
Average memory usage for gpt4all-falcon-newbpe-q4_0.gguf: 1287.0898 MB
