https://huggingface.co/CompendiumLabs/bge-large-en-v1.5-gguf

- https://pypi.org/project/llama-cpp-python/
- https://pypi.org/project/scikit-learn/
- https://pypi.org/project/beautifulsoup4/

requirements.txt ->
llama-cpp-python
scikit-learn 
scipy 
numpy

In [1]:
# !pip install -q llama-cpp-python
# !pip install -q scikit-learn scipy numpy
# !pip install -q beautifulsoup4

In [2]:
!ls

archive
bge-large-en-v1.5-f32.gguf
bge-large-en-v1.5-q4_k_m.gguf
embedding_model_llama_cpp_search_match_v10.ipynb
embedding_model_llama_cpp_search_match_v9.ipynb
embedding_model_llama_cpp_test.ipynb
env
requirements.txt


In [3]:
# GGUF model file, resolved relative to the notebook's working directory.
# This is the full-precision (f32) build; a q4_k_m build sits next to it.
model_path = "bge-large-en-v1.5-f32.gguf"

In [4]:
# Short sample string used to check that the embedding call works.
text_to_embed = "hello world"

In [5]:
from llama_cpp import Llama
# Load the GGUF file with embedding=True so the model can be used through
# model.embed(...) in the cells below.
model = Llama(model_path, embedding=True)


llama_model_loader: loaded meta data with 23 key-value pairs and 389 tensors from bge-large-en-v1.5-f32.gguf (version GGUF V3 (latest))
llama_model_loader: Dumping metadata keys/values. Note: KV overrides do not apply in this output.
llama_model_loader: - kv   0:                       general.architecture str              = bert
llama_model_loader: - kv   1:                               general.name str              = bge-large-en-v1.5
llama_model_loader: - kv   2:                           bert.block_count u32              = 24
llama_model_loader: - kv   3:                        bert.context_length u32              = 512
llama_model_loader: - kv   4:                      bert.embedding_length u32              = 1024
llama_model_loader: - kv   5:                   bert.feed_forward_length u32              = 4096
llama_model_loader: - kv   6:                  bert.attention.head_count u32              = 16
llama_model_loader: - kv   7:          bert.attention.layer_norm_epsilon f32   

In [6]:
# Smoke test: embed the sample string to confirm the model runs end to end.
embed = model.embed(text_to_embed)


llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =      87.70 ms /     4 tokens (   21.93 ms per token,    45.61 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =      90.53 ms /     5 tokens


In [7]:
## inspection to see if pipeline is working
# print(embed)

In [8]:
# Embed two closely related words as sample inputs.
# NOTE: embedding1 / embedding2 are reassigned by the search cell further down.
embedding1 = model.embed("flower")
embedding2 = model.embed("blossom")


llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =      89.73 ms /     3 tokens (   29.91 ms per token,    33.44 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =      90.78 ms /     4 tokens

llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =      77.53 ms /     3 tokens (   25.84 ms per token,    38.70 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =      78.36 ms /     4 tokens


In [9]:
#############################################
# get_vector function to modularize pipeline
#############################################
def get_vector(text_to_vectorize):
    """
    Embed a piece of text with the notebook's loaded model.

    Thin wrapper so the rest of the pipeline never calls the model
    object directly.

    Args:
        text_to_vectorize: Text passed unchanged to ``model.embed``.

    Returns:
        Whatever ``model.embed`` returns for that input.
    """
    embedding = model.embed(text_to_vectorize)
    return embedding

In [10]:
# step 1: embed the search-phrase
# step 2: embed each text
# step 3: get scores
# step 4: evaluate whether the score is a success or a failure
# step 5: if success: do stuff with text, else: move on

In [11]:


from sklearn.metrics.pairwise import cosine_similarity

def cosine_similarity_distance(embedding1, embedding2, boolean=False, threshold=0.6):
    """
    Cosine similarity between two embedding vectors.

    The score is the cosine of the angle between the vectors and lies
    between -1 and 1: 1 means they point the same way, 0 means they are
    orthogonal, and -1 means they point in opposite directions.

    Author's note: unsurprisingly, this one looks solid (gold standard?).

    Args:
        embedding1: First vector (1-D sequence of numbers).
        embedding2: Second vector, same length as the first.
        boolean: If False (default) return the raw score; if True return
            a pass/fail verdict.
        threshold: Minimum score that counts as a match in boolean mode.

    Returns:
        The similarity score, or True/False when ``boolean`` is set.
    """
    # scikit-learn works on 2-D inputs, so each vector is wrapped as a
    # one-row matrix and the single cell of the 1x1 result is read back.
    similarity_matrix = cosine_similarity([embedding1], [embedding2])
    similarity = similarity_matrix[0][0]

    if boolean:
        # Anything not strictly below the threshold counts as a match.
        return not similarity < threshold

    return similarity


from scipy.spatial.distance import euclidean

def euclidean_distance(embedding1, embedding2, boolean=False, threshold=0.5):
    """
    Similarity derived from the Euclidean (straight-line) distance.

    The distance d is mapped to 1 / (1 + d), so identical vectors score
    1.0 and the score falls towards 0 as the vectors move apart.

    Args:
        embedding1: First vector (1-D sequence of numbers).
        embedding2: Second vector, same length as the first.
        boolean: If False (default) return the raw score; if True return
            a pass/fail verdict.
        threshold: Minimum score that counts as a match in boolean mode.

    Returns:
        The similarity score, or True/False when ``boolean`` is set.
    """
    distance = euclidean(embedding1, embedding2)
    similarity = 1 / (1 + distance)

    if boolean:
        # Anything not strictly below the threshold counts as a match.
        return not similarity < threshold

    return similarity



import numpy as np

def normalized_dot_product(embedding1, embedding2, boolean=False, threshold=0.6):
    """
    Dot product of two vectors divided by the product of their lengths.

    This is the cosine similarity computed by hand: the sum of the
    products of corresponding entries, normalized by both vector norms.

    If either vector has zero length the quotient would be 0/0 (NaN).
    That case is scored as 0.0, so it can never be reported as a match.

    Author's note: a threshold around 0.5 seemed OK.

    Args:
        embedding1: First vector (1-D sequence of numbers).
        embedding2: Second vector, same length as the first.
        boolean: If False (default) return the raw score; if True return
            a pass/fail verdict.
        threshold: Minimum score that counts as a match in boolean mode.

    Returns:
        The similarity score, or True/False when ``boolean`` is set.
    """
    dot_product = np.dot(embedding1, embedding2)
    norm_product = np.linalg.norm(embedding1) * np.linalg.norm(embedding2)

    if norm_product == 0:
        # Zero-length vector: no direction to compare, treat as dissimilar.
        similarity = 0.0
    else:
        similarity = dot_product / norm_product

    if not boolean:
        return similarity

    return bool(similarity >= threshold)


from scipy.spatial.distance import cityblock

def manhattan_distance(embedding1, embedding2, boolean=False, threshold=0.0024):
    """
    Similarity derived from the Manhattan (city-block) distance.

    The distance is the sum of the absolute differences between
    corresponding coordinates. It is mapped to 1 / (1 + d), so identical
    vectors score 1.0.

    Args:
        embedding1: First vector (1-D sequence of numbers).
        embedding2: Second vector, same length as the first.
        boolean: If False (default) return the raw score; if True return
            a pass/fail verdict.
        threshold: Minimum score that counts as a match in boolean mode.

    Returns:
        The similarity score, or True/False when ``boolean`` is set.
    """
    distance = cityblock(embedding1, embedding2)
    similarity = 1 / (1 + distance)

    if boolean:
        # Anything not strictly below the threshold counts as a match.
        return not similarity < threshold

    return similarity



from scipy.stats import pearsonr

def pearson_correlation(embedding1, embedding2, boolean=False, threshold=0.6):
    """
    Pearson correlation between two embedding vectors.

    Measures linear correlation and ranges from -1 (perfectly negatively
    correlated) to 1 (perfectly positively correlated).

    When one input is constant the coefficient is undefined and SciPy
    returns NaN. The raw score is passed through unchanged, but in
    boolean mode an undefined score is reported as "no match".

    Author's note: maybe decent around 0.6?

    Args:
        embedding1: First vector (1-D sequence of numbers).
        embedding2: Second vector, same length as the first.
        boolean: If False (default) return the raw score; if True return
            a pass/fail verdict.
        threshold: Minimum score that counts as a match in boolean mode.

    Returns:
        The correlation coefficient, or True/False when ``boolean`` is set.
    """
    similarity, _ = pearsonr(embedding1, embedding2)

    if not boolean:
        return similarity

    # NaN >= threshold is False, so an undefined correlation never passes.
    return bool(similarity >= threshold)



from scipy.stats import spearmanr

def spearmans_rank_correlation(embedding1, embedding2, boolean=False, threshold=0.6):
    """
    Spearman's rank correlation between two embedding vectors.

    A non-parametric measure of how monotonic the relationship between
    the two vectors is. Unlike Pearson correlation it does not assume
    the relationship is linear.

    When one input is constant the coefficient is undefined and SciPy
    returns NaN. The raw score is passed through unchanged, but in
    boolean mode an undefined score is reported as "no match".

    Author's note: a stricter measure?

    Args:
        embedding1: First vector (1-D sequence of numbers).
        embedding2: Second vector, same length as the first.
        boolean: If False (default) return the raw score; if True return
            a pass/fail verdict.
        threshold: Minimum score that counts as a match in boolean mode.

    Returns:
        The correlation coefficient, or True/False when ``boolean`` is set.
    """
    similarity, _ = spearmanr(embedding1, embedding2)

    if not boolean:
        return similarity

    # NaN >= threshold is False, so an undefined correlation never passes.
    return bool(similarity >= threshold)


from scipy.stats import kendalltau
def kendalls_rank_correlation(embedding1, embedding2, boolean=False, threshold=0.7):
    """
    Kendall's rank correlation (tau) between two embedding vectors.

    A non-parametric measure of ordinal association: how well the
    ranking of one vector's components agrees with the other's.

    When one input is constant tau is undefined and SciPy returns NaN.
    The raw score is passed through unchanged, but in boolean mode an
    undefined score is reported as "no match".

    Author's notes:
        0.3 may match the subject generally
        0.5 may most closely match meaning

    Args:
        embedding1: First vector (1-D sequence of numbers).
        embedding2: Second vector, same length as the first.
        boolean: If False (default) return the raw score; if True return
            a pass/fail verdict.
        threshold: Minimum score that counts as a match in boolean mode.

    Returns:
        The tau statistic, or True/False when ``boolean`` is set.
    """
    similarity, _ = kendalltau(embedding1, embedding2)

    if not boolean:
        return similarity

    # NaN >= threshold is False, so an undefined correlation never passes.
    return bool(similarity >= threshold)



from scipy.spatial.distance import minkowski


def minkowski_distance(embedding1, embedding2, boolean=False, threshold=0.055, p=2):
    """
    Similarity derived from the Minkowski distance of order ``p``.

    The Minkowski distance generalizes both the Manhattan and Euclidean
    distances: it is the p-th root of the sum of the p-th powers of the
    absolute coordinate differences. With p=1 it is the Manhattan
    distance and with p=2 the Euclidean distance. The distance d is
    mapped to 1 / (1 + d), so identical vectors score 1.0.

    Args:
        embedding1: First vector (1-D sequence of numbers).
        embedding2: Second vector, same length as the first.
        boolean: If False (default) return the raw score; if True return
            a pass/fail verdict.
        threshold: Minimum score that counts as a match in boolean mode.
            The default was chosen with p=2 in use; revisit it when
            passing a different ``p``.
        p: Order of the distance. Defaults to 2, the value this function
            previously hard-coded.

    Returns:
        The similarity score, or True/False when ``boolean`` is set.
    """
    distance = minkowski(embedding1, embedding2, p=p)
    similarity = 1 / (1 + distance)

    if not boolean:
        return similarity

    # Anything not strictly below the threshold counts as a match.
    return not similarity < threshold



from scipy.spatial.distance import chebyshev
def chebyshev_distance(embedding1, embedding2, boolean=False, threshold=0.4):
    """
    Similarity derived from the Chebyshev distance.

    The distance is the largest absolute difference between any pair of
    corresponding coordinates. It is mapped to 1 / (1 + d), so identical
    vectors score 1.0.

    Args:
        embedding1: First vector (1-D sequence of numbers).
        embedding2: Second vector, same length as the first.
        boolean: If False (default) return the raw score; if True return
            a pass/fail verdict.
        threshold: Minimum score that counts as a match in boolean mode.

    Returns:
        The similarity score, or True/False when ``boolean`` is set.
    """
    distance = chebyshev(embedding1, embedding2)
    similarity = 1 / (1 + distance)

    if boolean:
        # Anything not strictly below the threshold counts as a match.
        return not similarity < threshold

    return similarity



import numpy as np
from scipy.spatial.distance import mahalanobis
from numpy.linalg import inv

def mahalanobis_distance(embedding1, embedding2, boolean=False, threshold=0.415):
    """
    Similarity derived from a Mahalanobis distance between two vectors.

    The Mahalanobis distance (P. C. Mahalanobis, 1936) is a multivariate
    generalization of the Euclidean distance that weights differences by
    the inverse of a covariance matrix. Here the covariance is estimated
    from just the two input vectors and the identity matrix is added to
    it before inversion. The distance d is mapped to 1 / (1 + d).

    Args:
        embedding1: First vector (1-D sequence of numbers).
        embedding2: Second vector, same length as the first.
        boolean: If False (default) return the raw score; if True return
            a pass/fail verdict.
        threshold: Minimum score that counts as a match in boolean mode.

    Returns:
        The similarity score, or True/False when ``boolean`` is set.
    """
    # Stack the two vectors as rows: two observations, one column per dimension.
    samples = np.array([embedding1, embedding2])
    n_dimensions = samples.shape[1]

    # Covariance across dimensions plus the full identity matrix as the
    # regularizer (the 1e-6 scale factor is disabled).
    regularized_cov = np.cov(samples, rowvar=False) + np.eye(n_dimensions)# * 1e-6

    inverse_cov = inv(regularized_cov)
    distance = mahalanobis(embedding1, embedding2, inverse_cov)
    similarity = 1 / (1 + distance)

    if boolean:
        # Anything not strictly below the threshold counts as a match.
        return not similarity < threshold

    return similarity




from scipy.spatial.distance import braycurtis
def bray_curtis_distance_dissimilarity(embedding1, embedding2, boolean=False, threshold=0.75):
    """
    Similarity derived from the Bray-Curtis dissimilarity.

    Bray-Curtis is used in ecology to compare species composition
    between samples: the sum of the absolute differences between the
    vectors divided by the sum of their sums. The dissimilarity d is
    mapped to 1 / (1 + d), so identical vectors score 1.0.

    Author's notes:
        0.75 is maybe a stricter yes,
        but a total "no" still scores 0.6+.

    Args:
        embedding1: First vector (1-D sequence of numbers).
        embedding2: Second vector, same length as the first.
        boolean: If False (default) return the raw score; if True return
            a pass/fail verdict.
        threshold: Minimum score that counts as a match in boolean mode.

    Returns:
        The similarity score, or True/False when ``boolean`` is set.
    """
    dissimilarity = braycurtis(embedding1, embedding2)
    similarity = 1 / (1 + dissimilarity)

    if boolean:
        # Anything not strictly below the threshold counts as a match.
        return not similarity < threshold

    return similarity



from scipy.spatial.distance import canberra
def canberra_distance(embedding1, embedding2, boolean=False, threshold=0.002):
    """
    Similarity derived from the Canberra distance (a dissimilarity).

    For each coordinate the absolute difference is divided by the sum of
    the two absolute values, and these ratios are summed. The distance d
    is mapped to 1 / (1 + d), so identical vectors score 1.0.

    Args:
        embedding1: First vector (1-D sequence of numbers).
        embedding2: Second vector, same length as the first.
        boolean: If False (default) return the raw score; if True return
            a pass/fail verdict.
        threshold: Minimum score that counts as a match in boolean mode.

    Returns:
        The similarity score, or True/False when ``boolean`` is set.
    """
    distance = canberra(embedding1, embedding2)
    similarity = 1 / (1 + distance)

    if boolean:
        # Anything not strictly below the threshold counts as a match.
        return not similarity < threshold

    return similarity




from scipy.stats import pearsonr
def correlation_distance_dissimilarity_measure(embedding1, embedding2, boolean=False, threshold=0.7):
    """
    Similarity derived from a correlation distance (a dissimilarity).

    The distance is 1 - |r|, where r is the Pearson correlation
    coefficient of the two vectors, and it is mapped to 1 / (1 + d).
    Scores therefore lie between 0.5 (uncorrelated) and 1.0 (perfectly
    correlated). Because the absolute value of r is used, a strong
    negative correlation scores as high as a strong positive one.

    When one input is constant r is undefined and SciPy returns NaN.
    The raw score is passed through unchanged, but in boolean mode an
    undefined score is reported as "no match".

    Author's note: even a "no" scores high... maybe 0.7 is OK?

    Args:
        embedding1: First vector (1-D sequence of numbers).
        embedding2: Second vector, same length as the first.
        boolean: If False (default) return the raw score; if True return
            a pass/fail verdict.
        threshold: Minimum score that counts as a match in boolean mode.

    Returns:
        The similarity score, or True/False when ``boolean`` is set.
    """
    correlation, _ = pearsonr(embedding1, embedding2)
    distance = 1 - abs(correlation)
    similarity = 1 / (1 + distance)

    if not boolean:
        return similarity

    # NaN >= threshold is False, so an undefined correlation never passes.
    return bool(similarity >= threshold)




from scipy.spatial.distance import sqeuclidean
def squared_euclidean_distance_dissimilarity_measure(embedding1, embedding2, boolean=False, threshold=0.005):
    """
    Similarity derived from the squared Euclidean distance (a dissimilarity).

    The distance is the sum of the squared coordinate differences, i.e.
    the Euclidean distance without the final square root. It is mapped
    to 1 / (1 + d), so identical vectors score 1.0.

    Args:
        embedding1: First vector (1-D sequence of numbers).
        embedding2: Second vector, same length as the first.
        boolean: If False (default) return the raw score; if True return
            a pass/fail verdict.
        threshold: Minimum score that counts as a match in boolean mode.

    Returns:
        The similarity score, or True/False when ``boolean`` is set.
    """
    distance = sqeuclidean(embedding1, embedding2)
    similarity = 1 / (1 + distance)

    if boolean:
        # Anything not strictly below the threshold counts as a match.
        return not similarity < threshold

    return similarity


from scipy.spatial.distance import hamming
def hamming_distance_dissimilarity_measure(embedding1, embedding2, boolean=False, threshold=0.75):
    """
    Similarity derived from the Hamming distance (a dissimilarity).

    SciPy's Hamming distance is the proportion of positions at which the
    two vectors disagree. It is meant for binary or categorical vectors,
    since components are compared for exact equality. The distance d is
    mapped to 1 / (1 + d), so scores lie between 0.5 (every position
    differs) and 1.0 (identical).

    The ``boolean`` and ``threshold`` parameters were missing from the
    signature although the body used them, so every call raised
    NameError. They now match the other comparison functions.

    Args:
        embedding1: First vector (1-D sequence, ideally binary).
        embedding2: Second vector, same length as the first.
        boolean: If False (default) return the raw score; if True return
            a pass/fail verdict.
        threshold: Minimum score that counts as a match in boolean mode.
            The default is an untuned placeholder.

    Returns:
        The similarity score, or True/False when ``boolean`` is set.
    """
    distance = hamming(embedding1, embedding2)
    similarity = 1 / (1 + distance)

    if not boolean:
        return similarity

    # Anything not strictly below the threshold counts as a match.
    return not similarity < threshold



# """
# not for vectors
# dissimilarity
# Jensen-Shannon Distance: This is a measure of the dissimilarity
# between two probability distributions. It is defined as the square root
# of the Jensen-Shannon divergence. It is a symmetric and smooth measure
# of dissimilarity that is always greater than or equal to 0.
# """
# from scipy.spatial.distance import jensenshannon
# import numpy as np
# def jensen_shannon_distance_dissimilarity_measure(embedding1, embedding2):
#     # Assuming embedding1 and embedding2 are your probability distributions
#     # Compute the average of the two distributions
#     average = 0.5 * np.add(embedding1, embedding2)
#     # Compute the Jensen-Shannon divergence
#     jsd = 0.5 * jensenshannon(embedding1, average) + 0.5 * jensenshannon(embedding2, average)
#     # Compute the Jensen-Shannon distance
#     dissimilarity = np.sqrt(jsd)
#     return dissimilarity



# """
# not for vectors
# dissimilarity
# Kullback-Leibler Divergence:
# This is a measure of the dissimilarity between two probability distributions.
#  It is not symmetric, meaning that the divergence from
#  distribution P to distribution Q is not
#  necessarily the same as the divergence from Q to P.
# """
# from scipy.special import kl_div
# def kullback_leibler_distance_dissimilarity_measure(embedding1, embedding2):
#     # Assuming embedding1 and embedding2 are your probability distributions
#     # Compute the Kullback-Leibler divergence
#     kld = np.sum(kl_div(embedding1, embedding2))
#     return kld



from scipy.stats import wasserstein_distance
def total_variation_distance_dissimilarity_measure(embedding1, embedding2, boolean=False, threshold=0.97):
    """
    Similarity derived from SciPy's ``wasserstein_distance`` (a dissimilarity).

    NOTE: despite the function name, the value computed here is the 1-D
    Wasserstein (earth mover's) distance, not the total variation
    distance (half the sum of absolute differences between two
    probability vectors). The components of each embedding are treated
    as a set of observed values, so the order of the components does
    not affect the result. The distance d is mapped to 1 / (1 + d).

    Author's note: all scores are high; maybe 0.97 is strict enough?

    Args:
        embedding1: First vector (1-D sequence of numbers).
        embedding2: Second vector (1-D sequence of numbers).
        boolean: If False (default) return the raw score; if True return
            a pass/fail verdict.
        threshold: Minimum score that counts as a match in boolean mode.

    Returns:
        The similarity score, or True/False when ``boolean`` is set.
    """
    distance = wasserstein_distance(embedding1, embedding2)
    similarity = 1 / (1 + distance)

    if boolean:
        # Anything not strictly below the threshold counts as a match.
        return not similarity < threshold

    return similarity








In [12]:

# step 1: embed the search-phrase
# step 2: embed each text
# step 3: get scores
# step 4: evaluate whether the score is a success or a failure
# step 5: if success: do stuff with text, else: move on

# arxiv inspector


import requests
from bs4 import BeautifulSoup
import json

##########################################
# Make comparison phrase and vectorize it
##########################################
comparison_phrase = "I will not be coming to dinner."

embedding1 = get_vector(comparison_phrase)

# Test sentences: the phrase itself and paraphrases of it first, then
# loosely related sentences, then unrelated words.
articles = [
    "I will not be coming to dinner.",
    "I should not attend supper",
    "When you dine tonight I will not be there",
    "at the time of evening nutrition, my attendance will be lacking,",

    "For lunch people go to eat food.",
    "I will be eating eggs for breakfast",

    "dogs dance",
    "rocks",
    "velocity",
]

# List to hold all article data
article_data = []

# (function, label) pairs for every metric that takes part in the vote.
# Built once, before the loop, because it does not depend on the article.
list_of_comparison_function_tuples = [
    (cosine_similarity_distance, "cosine_similarity_distance"),
    (correlation_distance_dissimilarity_measure, "correlation_distance_dissimilarity_measure"),
    (pearson_correlation, "pearson_correlation"),
    # (mahalanobis_distance, "mahalanobis_distance"),
    (canberra_distance, "canberra_distance"),
    (euclidean_distance, "euclidean_distance"),
    (manhattan_distance, "manhattan_distance"),
    (minkowski_distance, "minkowski_distance"),
    (squared_euclidean_distance_dissimilarity_measure, "squared_euclidean_distance_dissimilarity_measure"),
    (chebyshev_distance, "chebyshev_distance"),
    (kendalls_rank_correlation, "kendalls_rank_correlation"),
    (bray_curtis_distance_dissimilarity, "bray_curtis_distance_dissimilarity"),
    (normalized_dot_product, "normalized_dot_product"),
    (spearmans_rank_correlation, "spearmans_rank_correlation"),
    (total_variation_distance_dissimilarity_measure, "total_variation_distance_dissimilarity_measure"),
]

for article in articles:

    extracted_article_string = article

    # Embed the candidate text.
    embedding2 = get_vector(extracted_article_string)

    # The third positional argument is boolean=True: each metric returns a
    # pass/fail vote against its own default threshold.
    arguments = (embedding1, embedding2, True)

    print(f"For {comparison_phrase} vs. {extracted_article_string[:100]}")

    # One vote per metric, in the order listed above.
    list_of_boolean_scores = [
        comparison_function(*arguments)
        for comparison_function, _label in list_of_comparison_function_tuples
    ]

    # Number of metrics that voted "match" (a count, despite the name).
    ratio_score = list_of_boolean_scores.count(True)

    print(f"{ratio_score} / {len(list_of_boolean_scores)}")




llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =      48.14 ms /    10 tokens (    4.81 ms per token,   207.73 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =      48.70 ms /    11 tokens

llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =      50.70 ms /    10 tokens (    5.07 ms per token,   197.25 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =      52.07 ms /    11 tokens

llama_print_timings:     

For I will not be coming to dinner. vs. I will not be coming to dinner.
14 / 14
For I will not be coming to dinner. vs. I should not attend supper
12 / 14
For I will not be coming to dinner. vs. When you dine tonight I will not be there
12 / 14
For I will not be coming to dinner. vs. at the time of evening nutrition, my attendance will be lacking,



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =      50.16 ms /    10 tokens (    5.02 ms per token,   199.37 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =      51.41 ms /    11 tokens

llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =      63.90 ms /     9 tokens (    7.10 ms per token,   140.86 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =      65.84 ms /    10 tokens

llama_print_timings:     

7 / 14
For I will not be coming to dinner. vs. For lunch people go to eat food.
0 / 14
For I will not be coming to dinner. vs. I will be eating eggs for breakfast
0 / 14
For I will not be coming to dinner. vs. dogs dance
0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =      47.40 ms /     3 tokens (   15.80 ms per token,    63.29 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =      48.17 ms /     4 tokens

llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =      45.37 ms /     3 tokens (   15.12 ms per token,    66.12 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =      46.48 ms /     4 tokens


For I will not be coming to dinner. vs. rocks
0 / 14
For I will not be coming to dinner. vs. velocity
0 / 14


In [13]:

# step 1: embed the search-phrase
# step 2: embed each text
# step 3: get scores
# step 4: evaluate whether the score is a success or a failure
# step 5: if success: do stuff with text, else: move on

# arxiv inspector


import requests
from bs4 import BeautifulSoup
import json

##########################################
# Make comparison phrase and vectorize it
##########################################
comparison_phrase = "computer vision"
# comparison_phrase = "cyber security"

embedding1 = get_vector(comparison_phrase)



# Hand-written test corpus that the scoring loop in this cell compares against
# comparison_phrase. The first four entries are pasted arXiv-style listings
# (title, authors, subjects, abstract); the remaining entries are short phrases.
# The text inside the triple-quoted strings is embedded as-is, including its
# leading/trailing whitespace and line breaks.
articles = [
    """
    Principles of Designing Robust Remote Face Anti-Spoofing Systems Xiang Xu, Tianchen Zhao, Zheng Zhang, Zhihua Li, Jon Wu, Alessandro Achille, Mani Srivastava Comments: Under review Subjects: Computer Vision and Pattern Recognition (cs.CV); Cryptography and Security (cs.CR)
Protecting digital identities of human face from various attack vectors is paramount, and face anti-spoofing plays a crucial role in this endeavor. Current approaches primarily focus on detecting spoofing attempts within individual frames to detect presentation attacks. However, the emergence of hyper-realistic generative models capable of real-time operation has heightened the risk of digitally generated attacks. In light of these evolving threats, this paper aims to address two key aspects. First, it sheds light on the vulnerabilities of state-of-the-art face anti-spoofing methods against digital attacks. Second, it presents a comprehensive taxonomy of common threats encountered in face anti-spoofing systems. Through a series of experiments, we demonstrate the limitations of current face anti-spoofing detection techniques and their failure to generalize to novel digital attack scenarios. Notably, the existing models struggle with digital injection attacks including adversarial noise, realistic deepfake attacks, and digital replay attacks. To aid in the design and implementation of robust face anti-spoofing systems resilient to these emerging vulnerabilities, the paper proposes key design principles from model accuracy and robustness to pipeline robustness and even platform robustness. Especially, we suggest to implement the proactive face anti-spoofing system using active sensors to significant reduce the risks for unseen attack vectors and improve the user experience.
    """,

    """
    Stateless and Non-Interactive Order-Preserving Encryption for Outsourced Databases through Subtractive Homomorphism
Dongfang Zhao
Subjects: Cryptography and Security (cs.CR); Databases (cs.DB)

Order-preserving encryption (OPE) has been extensively studied for more than two decades in the context of outsourced databases because OPE is a key enabling technique to allow the outsourced database servers to sort encrypted tuples in order to build indexes, complete range queries, and so forth. The state-of-the-art OPE schemes require (i) a stateful client -- implying that the client manages the local storage of some mapping between plaintexts and ciphertexts, and/or (ii) the interaction between the client and the server during the query. In production systems, however, the above assumptions do not always hold (not to mention performance overhead): In the first case, the storage requirement could exceed the capability of the client; In the second case, the clients may not be accessible when the server executes a query involving sort or comparison.
This paper proposes a new OPE scheme that works for stateless clients and requires no client-server interaction during the queries. The key idea of our proposed protocol is to leverage the underlying additive property of a homomorphic encryption scheme such that the sign of the difference between two plaintexts can be revealed by some algebraic operations with an evaluation key. We will demonstrate the correctness and security of the proposed protocol in this short paper; the implementation and experimental results will be presented in an extended report. 
    """,
    """
    Npix2Cpix: A GAN-based Image-to-Image Translation Network with Retrieval-Classification Integration for Watermark Retrieval from Historical Document Images
Utsab Saha, Sawradip Saha, Shaikh Anowarul Fattah, Mohammad Saquib
Subjects: Computer Vision and Pattern Recognition (cs.CV)

The identification and restoration of ancient watermarks have long been a major topic in codicology and history. Classifying historical documents based on watermarks can be difficult due to the diversity of watermarks, crowded and noisy samples, multiple modes of representation, and minor distinctions between classes and intra-class changes. This paper proposes a U-net-based conditional generative adversarial network (GAN) to translate noisy raw historical watermarked images into clean, handwriting-free images with just watermarks. Considering its ability to perform image translation from degraded (noisy) pixels to clean pixels, the proposed network is termed as Npix2Cpix. Instead of employing directly degraded watermarked images, the proposed network uses image-to-image translation using adversarial learning to create clutter and handwriting-free images for restoring and categorizing the watermarks for the first time. In order to learn the mapping from input noisy image to output clean image, the generator and discriminator of the proposed U-net-based GAN are trained using two separate loss functions, each of which is based on the distance between images. After using the proposed GAN to pre-process noisy watermarked images, Siamese-based one-shot learning is used to classify watermarks. According to experimental results on a large-scale historical watermark dataset, extracting watermarks from tainted images can result in high one-shot classification accuracy. The qualitative and quantitative evaluation of the retrieved watermarks illustrates the effectiveness of the proposed approach. 
        """,
    """
    A Geometric View of Data Complexity: Efficient Local Intrinsic Dimension Estimation with Diffusion Models
Hamidreza Kamkari, Brendan Leigh Ross, Rasa Hosseinzadeh, Jesse C. Cresswell, Gabriel Loaiza-Ganem
Comments: 10 pages
Subjects: Machine Learning (cs.LG); Artificial Intelligence (cs.AI); Machine Learning (stat.ML)

High-dimensional data commonly lies on low-dimensional submanifolds, and estimating the local intrinsic dimension (LID) of a datum -- i.e. the dimension of the submanifold it belongs to -- is a longstanding problem. LID can be understood as the number of local factors of variation: the more factors of variation a datum has, the more complex it tends to be. Estimating this quantity has proven useful in contexts ranging from generalization in neural networks to detection of out-of-distribution data, adversarial examples, and AI-generated text. The recent successes of deep generative models present an opportunity to leverage them for LID estimation, but current methods based on generative models produce inaccurate estimates, require more than a single pre-trained model, are computationally intensive, or do not exploit the best available deep generative models, i.e. diffusion models (DMs). In this work, we show that the Fokker-Planck equation associated with a DM can provide a LID estimator which addresses all the aforementioned deficiencies. Our estimator, called FLIPD, is compatible with all popular DMs, and outperforms existing baselines on LID estimation benchmarks. We also apply FLIPD on natural images where the true LID is unknown. Compared to competing estimators, FLIPD exhibits a higher correlation with non-LID measures of complexity, better matches a qualitative assessment of complexity, and is the only estimator to remain tractable with high-resolution images at the scale of Stable Diffusion.
    """,

    # Short phrases. NOTE(review): presumably off-topic controls for the
    # search phrase -- confirm intent with the author.
    "For lunch people go to eat food.",
    "I will be eating eggs for breakfast", 
    
    "dogs dance",
    "table of contents",
    "rocks",
    "velocity",
]

# List to hold all article data.
# NOTE: nothing in this cell appends to it; the assignment is kept only so the
# name stays defined (and empty) after the cell has run.
article_data = []

##################################
# Comparison metrics
##################################
# (metric function, display name) pairs. The table does not depend on the
# article being scored, so it is built once here instead of on every iteration.
list_of_comparison_function_tuples = [
    (cosine_similarity_distance, "cosine_similarity_distance"),
    (correlation_distance_dissimilarity_measure, "correlation_distance_dissimilarity_measure"),
    (pearson_correlation, "pearson_correlation"),
    # (mahalanobis_distance, "mahalanobis_distance"),
    (canberra_distance, "canberra_distance"),
    (euclidean_distance, "euclidean_distance"),
    (manhattan_distance, "manhattan_distance"),
    (minkowski_distance, "minkowski_distance"),
    (squared_euclidean_distance_dissimilarity_measure, "squared_euclidean_distance_dissimilarity_measure"),
    (chebyshev_distance, "chebyshev_distance"),
    (kendalls_rank_correlation, "kendalls_rank_correlation"),
    (bray_curtis_distance_dissimilarity, "bray_curtis_distance_dissimilarity"),
    (normalized_dot_product, "normalized_dot_product"),
    (spearmans_rank_correlation, "spearmans_rank_correlation"),
    (total_variation_distance_dissimilarity_measure, "total_variation_distance_dissimilarity_measure"),
]

for article in articles:

    extracted_article_string = article

    ##################################
    # Do embedding search here:
    ##################################
    embedding2 = get_vector(extracted_article_string)

    # Arguments to pass to the functions.
    # NOTE(review): the trailing True presumably asks each metric for a boolean
    # verdict rather than a raw score (the results are tallied with
    # .count(True) below) -- confirm against the metric definitions.
    arguments = (embedding1, embedding2, True)

    # Only the first 100 characters of the text are echoed, to keep the output short.
    print(f"For {comparison_phrase} vs. {extracted_article_string[:100]}")

    # Call every metric with the same arguments and collect the results in table order.
    list_of_boolean_scores = [
        function_pointer(*arguments)
        for function_pointer, _function_name in list_of_comparison_function_tuples
    ]

    # Number of metrics that returned True (a count, despite the name).
    ratio_score = list_of_boolean_scores.count(True)

    print(f"{ratio_score} / {len(list_of_boolean_scores)}")




llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =      49.72 ms /     4 tokens (   12.43 ms per token,    80.46 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =      50.63 ms /     5 tokens

llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     691.87 ms /   349 tokens (    1.98 ms per token,   504.43 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     693.24 ms /   350 tokens


For computer vision vs. 
    Principles of Designing Robust Remote Face Anti-Spoofing Systems Xiang Xu, Tianchen Zhao, Zheng
6 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     538.97 ms /   329 tokens (    1.64 ms per token,   610.42 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     541.63 ms /   330 tokens


For computer vision vs. 
    Stateless and Non-Interactive Order-Preserving Encryption for Outsourced Databases through Subt
0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     684.65 ms /   382 tokens (    1.79 ms per token,   557.95 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     687.46 ms /   383 tokens


For computer vision vs. 
    Npix2Cpix: A GAN-based Image-to-Image Translation Network with Retrieval-Classification Integra
7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     761.09 ms /   402 tokens (    1.89 ms per token,   528.19 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     764.10 ms /   403 tokens

llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =      44.86 ms /    10 tokens (    4.49 ms per token,   222.90 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =      46.96 ms /    11 tokens

llama_print_timings:     

For computer vision vs. 
    A Geometric View of Data Complexity: Efficient Local Intrinsic Dimension Estimation with Diffus
7 / 14
For computer vision vs. For lunch people go to eat food.
0 / 14
For computer vision vs. I will be eating eggs for breakfast
0 / 14
For computer vision vs. dogs dance
0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =      46.44 ms /     5 tokens (    9.29 ms per token,   107.67 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =      47.19 ms /     6 tokens

llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =      48.29 ms /     3 tokens (   16.10 ms per token,    62.12 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =      49.33 ms /     4 tokens

llama_print_timings:     

For computer vision vs. table of contents
0 / 14
For computer vision vs. rocks
0 / 14
For computer vision vs. velocity
2 / 14


In [14]:

# # step 1: embed the search-phrase
# # step 2: embed each text
# # step 3: get scores
# # step 4: evaluate whether the score is a success or a failure
# # step 5: if success: do stuff with text, else: move on

# # arxiv inspector


# import requests
# from bs4 import BeautifulSoup
# import json

# ##########################################
# # Make comparison phrase and vectorize it
# ##########################################
# comparison_phrase = "Neural Networks"

# embedding1 = get_vector(comparison_phrase)


# # Make a request to the website
# r = requests.get('https://arxiv.org/list/cs/new')
# soup = BeautifulSoup(r.text, 'html.parser')

# # Find all the articles
# articles = soup.find_all('div', class_='meta')

# # List to hold all article data
# article_data = []

# for article in articles:
#     # Extract the title
#     title = article.find('div', class_='list-title mathjax').text.strip().replace('Title:', '')

#     # Extract the abstract
#     abstract = article.find('p', class_='mathjax').text.strip()

#     # Extract the link
#     link_element = article.find('a', title='Abstract')
#     if link_element:
#         link = 'https://arxiv.org' + link_element['href']
#     else:
#         link = ''


#     extracted_article_string = title + " " + abstract


#     ##################################
#     # Do embedding search here:
#     ##################################

#     embedding2 = get_vector(extracted_article_string)


#     ##################################
#     # Do basic embedding search here:
#     ##################################

#     # List of functions
#     list_of_comparison_functions = [
#         cosine_similarity_distance,
#         euclidean_distance,
#         dot_product,
#         manhattan_distance,
#         pearson_correlation,
#         spearmans_rank_correlation,
#         kendalls_rank_correlation,
#         minkowski_distance,
#         chebyshev_distance,
#         mahalanobis_distance,
#         bray_curtis_distance_dissimilarity,
#         canberra_distance,
#         correlation_distance_dissimilarity_measure,
#         squared_euclidean_distance_dissimilarity_measure,
#         hamming_distance_dissimilarity_measure,
#         jensen_shannon_distance_dissimilarity_measure,
#         kullback_leibler_distance_dissimilarity_measure,
#         total_variation_distance_dissimilarity_measure,
#         ]

#     # Arguments to pass to the functions
#     arguments = (embedding1, embedding2)

#     print(f"\n\n For {comparison_phrase} vs. {extracted_article_string[:200]}")
    
#     # Iterate through the functions and call each one with the arguments
#     for this_function in list_of_comparison_functions:
#         raw_score = this_function(*arguments)

#         print(raw_score)

#     input("PointBreak")


In [None]:

# Plan for this cell:
# step 1: embed the search-phrase
# step 2: embed each text
# step 3: get scores
# step 4: evaluate whether the score is a success or a failure
# step 5: if success: do stuff with text, else: move on

# arxiv inspector


import requests
from bs4 import BeautifulSoup
import json

##########################################
# Make comparison phrase and vectorize it
##########################################
# Exactly one phrase is active at a time. The alternatives stay commented out
# so that no assignment is silently overwritten by a later one.
# comparison_phrase = "computer vision and image enhancement"
# comparison_phrase = "cyber security"
comparison_phrase = "natural language processing"


# Embed the search phrase once. get_vector is defined in an earlier cell (not
# shown here); every fetched article is scored against this same vector.
embedding1 = get_vector(comparison_phrase)


# Make a request to the website.
# The timeout keeps the cell from hanging forever on a stalled connection, and
# raise_for_status() stops us from silently parsing an HTTP error page as if it
# were the listing.
REQUEST_TIMEOUT_SECONDS = 30
r = requests.get('https://arxiv.org/list/cs/new', timeout=REQUEST_TIMEOUT_SECONDS)
r.raise_for_status()
soup = BeautifulSoup(r.text, 'html.parser')

# Find all the articles
articles = soup.find_all('div', class_='meta')

# List to hold all article data (one dict per article that passes the filter)
article_data = []

##################################
# Comparison metrics
##################################
# (metric function, display name) pairs. The table does not depend on the
# article being scored, so it is built once here instead of on every iteration.
list_of_comparison_function_tuples = [
    (cosine_similarity_distance, "cosine_similarity_distance"),
    (correlation_distance_dissimilarity_measure, "correlation_distance_dissimilarity_measure"),
    (pearson_correlation, "pearson_correlation"),
    # (mahalanobis_distance, "mahalanobis_distance"),
    (canberra_distance, "canberra_distance"),
    (euclidean_distance, "euclidean_distance"),
    (manhattan_distance, "manhattan_distance"),
    (minkowski_distance, "minkowski_distance"),
    (squared_euclidean_distance_dissimilarity_measure, "squared_euclidean_distance_dissimilarity_measure"),
    (chebyshev_distance, "chebyshev_distance"),
    (kendalls_rank_correlation, "kendalls_rank_correlation"),
    (bray_curtis_distance_dissimilarity, "bray_curtis_distance_dissimilarity"),
    (normalized_dot_product, "normalized_dot_product"),
    (spearmans_rank_correlation, "spearmans_rank_correlation"),
    (total_variation_distance_dissimilarity_measure, "total_variation_distance_dissimilarity_measure"),
]

# Acceptance threshold: the fraction of metrics that must return True.
# Currently "at least 5 of the metrics in the table".
# target_score_decimal_percent = 0.5
target_score_decimal_percent = 5 / len(list_of_comparison_function_tuples)

# Entries that could not be scored because the title or abstract was missing.
skipped_entry_count = 0

for article in articles:
    title_element = article.find('div', class_='list-title mathjax')
    abstract_element = article.find('p', class_='mathjax')

    # find() returns None when the element is absent; calling .text on that
    # would abort the whole run with AttributeError, so skip such entries.
    if title_element is None or abstract_element is None:
        skipped_entry_count += 1
        continue

    # Extract the title. The "Title:" label is removed *before* the final
    # strip() so the whitespace that followed the label does not end up at the
    # start of the title.
    title = title_element.text.strip().removeprefix('Title:').strip()

    # Extract the abstract
    abstract = abstract_element.text.strip()

    # Extract the link. First look inside the article's own element (the
    # original behaviour).
    # NOTE(review): on the arXiv listing page the "Abstract" anchor appears to
    # live in the <dt> that precedes the element holding this 'meta' div, not
    # inside the div itself -- hence the fallback to the nearest preceding
    # anchor. Confirm against the current page markup.
    link_element = article.find('a', title='Abstract')
    if link_element is None:
        link_element = article.find_previous('a', title='Abstract')
    if link_element is not None:
        link = 'https://arxiv.org' + link_element['href']
    else:
        link = ''

    # Extract the subjects (a ';'-separated list after the "Subjects:" label)
    subjects_element = article.find('div', class_='list-subjects')
    if subjects_element is not None:
        subjects = subjects_element.text.strip().replace('Subjects:', '').split(';')
        subjects = [subject.strip() for subject in subjects]
    else:
        subjects = []

    # Text that gets embedded and compared with the search phrase.
    extracted_article_string = title + " " + abstract

    ##################################
    # Do embedding search here:
    ##################################
    embedding2 = get_vector(extracted_article_string)

    # Arguments to pass to the functions.
    # NOTE(review): the trailing True presumably asks each metric for a boolean
    # verdict rather than a raw score (the results are tallied with
    # .count(True) below) -- confirm against the metric definitions.
    arguments = (embedding1, embedding2, True)

    # print(f"For {comparison_phrase} vs. {extracted_article_string}")

    # Call every metric with the same arguments and collect the results in table order.
    list_of_boolean_scores = [
        function_pointer(*arguments)
        for function_pointer, _function_name in list_of_comparison_function_tuples
    ]

    # Number of metrics that returned True (a count, despite the name).
    ratio_score = list_of_boolean_scores.count(True)

    print(f"{ratio_score} / {len(list_of_boolean_scores)}")

    decimal_percent_true = ratio_score / len(list_of_boolean_scores)

    # Keep the article only if enough metrics judged it similar to the search phrase.
    if decimal_percent_true >= target_score_decimal_percent:

        # Append the data to the list
        article_data.append({
            'title': title,
            'abstract': abstract,
            'link': link,
            'subjects': subjects,
        })

if skipped_entry_count:
    print(f"Skipped {skipped_entry_count} entries without a title or abstract")





# Build a sortable, human-readable UTC timestamp (date, time, microseconds)
# that is used in the names of both output files.
from datetime import datetime, UTC
# Imported under an alias because the name `html` is used for the page string below.
from html import escape as escape_html
date_time = datetime.now(UTC)
clean_timestamp = date_time.strftime('%Y-%m-%d__%H%M%S%f')


# Save the data to a JSON file.
# The encoding is given explicitly so the result does not depend on the
# platform's default encoding.
with open(f'articles_{clean_timestamp}.json', 'w', encoding='utf-8') as f:
    json.dump(article_data, f)

# Create an HTML file.
# Titles, abstracts, links and subjects come from a scraped web page, so every
# value is HTML-escaped before being placed in the markup; otherwise a stray
# '<', '&' or '"' in the text would break the page (or inject markup into it).
html_parts = ['<html><head><meta charset="utf-8"></head><body>']
for article in article_data:
    safe_link = escape_html(article["link"], quote=True)
    safe_title = escape_html(article["title"])
    safe_abstract = escape_html(article["abstract"])
    safe_subjects = ", ".join(escape_html(subject) for subject in article["subjects"])

    html_parts.append(f'<h2><a href="{safe_link}">{safe_title}</a></h2>')
    html_parts.append(f'<p>{safe_abstract}</p>')
    html_parts.append(f'<p>Subjects: {safe_subjects}</p>')

html_parts.append('</body></html>')

# Join once at the end instead of growing a string inside the loop.
html = ''.join(html_parts)

# Save the HTML to a file, written as UTF-8 to match the charset declared in the page.
# NOTE: unlike the JSON file name, this name has no underscore before the
# timestamp; it is left unchanged so existing output naming is preserved.
with open(f'articles{clean_timestamp}.html', 'w', encoding='utf-8') as f:
    f.write(html)




llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =      53.95 ms /     5 tokens (   10.79 ms per token,    92.67 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =      54.85 ms /     6 tokens

llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     590.96 ms /   331 tokens (    1.79 ms per token,   560.11 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     592.55 ms /   332 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     518.86 ms /   238 tokens (    2.18 ms per token,   458.70 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     520.64 ms /   239 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     398.36 ms /   225 tokens (    1.77 ms per token,   564.82 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     400.43 ms /   226 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     691.08 ms /   362 tokens (    1.91 ms per token,   523.81 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     693.53 ms /   363 tokens


2 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     369.72 ms /   186 tokens (    1.99 ms per token,   503.09 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     371.38 ms /   187 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     642.20 ms /   354 tokens (    1.81 ms per token,   551.23 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     644.68 ms /   355 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     321.70 ms /   171 tokens (    1.88 ms per token,   531.56 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     324.09 ms /   172 tokens


5 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     439.45 ms /   260 tokens (    1.69 ms per token,   591.64 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     441.32 ms /   261 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     395.43 ms /   206 tokens (    1.92 ms per token,   520.95 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     397.50 ms /   207 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     384.89 ms /   212 tokens (    1.82 ms per token,   550.81 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     387.01 ms /   213 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     552.26 ms /   274 tokens (    2.02 ms per token,   496.15 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     554.55 ms /   275 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     752.22 ms /   376 tokens (    2.00 ms per token,   499.86 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     755.12 ms /   377 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     623.79 ms /   340 tokens (    1.83 ms per token,   545.06 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     626.15 ms /   341 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     454.12 ms /   241 tokens (    1.88 ms per token,   530.69 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     457.14 ms /   242 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     628.84 ms /   344 tokens (    1.83 ms per token,   547.04 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     631.20 ms /   345 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     566.97 ms /   307 tokens (    1.85 ms per token,   541.48 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     570.09 ms /   308 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     464.87 ms /   246 tokens (    1.89 ms per token,   529.18 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     467.13 ms /   247 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     501.97 ms /   278 tokens (    1.81 ms per token,   553.82 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     503.94 ms /   279 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     410.68 ms /   226 tokens (    1.82 ms per token,   550.31 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     413.11 ms /   227 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     659.62 ms /   348 tokens (    1.90 ms per token,   527.58 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     661.96 ms /   349 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     489.17 ms /   288 tokens (    1.70 ms per token,   588.75 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     491.70 ms /   289 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     348.37 ms /   186 tokens (    1.87 ms per token,   533.92 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     349.89 ms /   187 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     596.59 ms /   328 tokens (    1.82 ms per token,   549.80 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     598.30 ms /   329 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     324.00 ms /   169 tokens (    1.92 ms per token,   521.61 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     326.77 ms /   170 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     439.24 ms /   223 tokens (    1.97 ms per token,   507.69 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     442.15 ms /   224 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     406.42 ms /   167 tokens (    2.43 ms per token,   410.91 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     408.36 ms /   168 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     363.14 ms /   212 tokens (    1.71 ms per token,   583.79 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     364.21 ms /   213 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     339.14 ms /   191 tokens (    1.78 ms per token,   563.19 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     341.19 ms /   192 tokens


5 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =    1394.62 ms /   266 tokens (    5.24 ms per token,   190.73 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =    1397.09 ms /   267 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     498.38 ms /   203 tokens (    2.46 ms per token,   407.32 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     501.10 ms /   204 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     578.00 ms /   219 tokens (    2.64 ms per token,   378.89 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     580.38 ms /   220 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     570.25 ms /   240 tokens (    2.38 ms per token,   420.87 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     572.91 ms /   241 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     524.19 ms /   224 tokens (    2.34 ms per token,   427.33 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     526.80 ms /   225 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     638.45 ms /   254 tokens (    2.51 ms per token,   397.84 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     640.88 ms /   255 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     662.38 ms /   278 tokens (    2.38 ms per token,   419.70 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     664.75 ms /   279 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     570.45 ms /   232 tokens (    2.46 ms per token,   406.70 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     572.46 ms /   233 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     315.30 ms /   144 tokens (    2.19 ms per token,   456.71 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     317.19 ms /   145 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     757.85 ms /   320 tokens (    2.37 ms per token,   422.25 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     760.49 ms /   321 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     596.79 ms /   265 tokens (    2.25 ms per token,   444.04 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     598.97 ms /   266 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     657.93 ms /   284 tokens (    2.32 ms per token,   431.65 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     660.29 ms /   285 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     533.47 ms /   148 tokens (    3.60 ms per token,   277.43 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     535.57 ms /   149 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     545.75 ms /   217 tokens (    2.51 ms per token,   397.62 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     547.39 ms /   218 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     447.30 ms /   194 tokens (    2.31 ms per token,   433.71 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     448.67 ms /   195 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     900.76 ms /   365 tokens (    2.47 ms per token,   405.21 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     902.53 ms /   366 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     727.28 ms /   305 tokens (    2.38 ms per token,   419.37 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     728.95 ms /   306 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     574.70 ms /   245 tokens (    2.35 ms per token,   426.31 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     576.01 ms /   246 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     321.93 ms /   141 tokens (    2.28 ms per token,   437.98 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     323.13 ms /   142 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     406.17 ms /   172 tokens (    2.36 ms per token,   423.47 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     407.59 ms /   173 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     682.81 ms /   255 tokens (    2.68 ms per token,   373.46 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     684.81 ms /   256 tokens


2 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     497.18 ms /   221 tokens (    2.25 ms per token,   444.50 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     498.76 ms /   222 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     575.07 ms /   245 tokens (    2.35 ms per token,   426.04 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     576.37 ms /   246 tokens


5 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     841.58 ms /   300 tokens (    2.81 ms per token,   356.47 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     842.80 ms /   301 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     689.30 ms /   274 tokens (    2.52 ms per token,   397.50 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     691.03 ms /   275 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     865.68 ms /   336 tokens (    2.58 ms per token,   388.13 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     867.63 ms /   337 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     390.48 ms /   149 tokens (    2.62 ms per token,   381.59 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     391.88 ms /   150 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =    1174.49 ms /   424 tokens (    2.77 ms per token,   361.01 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =    1176.45 ms /   425 tokens


5 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     469.53 ms /   178 tokens (    2.64 ms per token,   379.10 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     471.27 ms /   179 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     685.84 ms /   269 tokens (    2.55 ms per token,   392.22 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     687.94 ms /   270 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     493.98 ms /   204 tokens (    2.42 ms per token,   412.98 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     495.85 ms /   205 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     449.78 ms /   170 tokens (    2.65 ms per token,   377.97 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     451.98 ms /   171 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     639.55 ms /   239 tokens (    2.68 ms per token,   373.70 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     641.36 ms /   240 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     663.26 ms /   217 tokens (    3.06 ms per token,   327.17 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     665.74 ms /   218 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     815.57 ms /   302 tokens (    2.70 ms per token,   370.29 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     818.12 ms /   303 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     944.62 ms /   390 tokens (    2.42 ms per token,   412.86 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     946.52 ms /   391 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     267.22 ms /   119 tokens (    2.25 ms per token,   445.33 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     268.77 ms /   120 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     364.68 ms /   163 tokens (    2.24 ms per token,   446.97 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     366.53 ms /   164 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     729.87 ms /   321 tokens (    2.27 ms per token,   439.80 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     732.37 ms /   322 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     572.02 ms /   252 tokens (    2.27 ms per token,   440.54 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     574.13 ms /   253 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     725.83 ms /   330 tokens (    2.20 ms per token,   454.65 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     726.92 ms /   331 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     418.42 ms /   183 tokens (    2.29 ms per token,   437.36 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     419.69 ms /   184 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     663.17 ms /   295 tokens (    2.25 ms per token,   444.83 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     664.42 ms /   296 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     582.73 ms /   245 tokens (    2.38 ms per token,   420.43 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     584.13 ms /   246 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     501.50 ms /   223 tokens (    2.25 ms per token,   444.67 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     502.65 ms /   224 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     265.22 ms /   118 tokens (    2.25 ms per token,   444.91 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     266.79 ms /   119 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     693.83 ms /   303 tokens (    2.29 ms per token,   436.70 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     695.73 ms /   304 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     754.40 ms /   336 tokens (    2.25 ms per token,   445.39 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     756.21 ms /   337 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     533.54 ms /   237 tokens (    2.25 ms per token,   444.20 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     536.26 ms /   238 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     725.51 ms /   312 tokens (    2.33 ms per token,   430.04 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     727.59 ms /   313 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     673.86 ms /   296 tokens (    2.28 ms per token,   439.26 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     676.58 ms /   297 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     668.91 ms /   291 tokens (    2.30 ms per token,   435.04 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     671.33 ms /   292 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     405.67 ms /   182 tokens (    2.23 ms per token,   448.64 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     407.57 ms /   183 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     578.46 ms /   244 tokens (    2.37 ms per token,   421.81 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     580.57 ms /   245 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     509.46 ms /   232 tokens (    2.20 ms per token,   455.38 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     511.46 ms /   233 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     546.65 ms /   239 tokens (    2.29 ms per token,   437.21 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     548.63 ms /   240 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     652.30 ms /   293 tokens (    2.23 ms per token,   449.18 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     654.41 ms /   294 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     599.42 ms /   273 tokens (    2.20 ms per token,   455.44 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     601.66 ms /   274 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     905.44 ms /   375 tokens (    2.41 ms per token,   414.16 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     908.38 ms /   376 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     427.97 ms /   177 tokens (    2.42 ms per token,   413.58 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     429.95 ms /   178 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     530.73 ms /   232 tokens (    2.29 ms per token,   437.13 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     533.31 ms /   233 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     574.77 ms /   262 tokens (    2.19 ms per token,   455.83 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     577.55 ms /   263 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     584.72 ms /   266 tokens (    2.20 ms per token,   454.92 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     586.93 ms /   267 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     802.62 ms /   347 tokens (    2.31 ms per token,   432.33 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     805.39 ms /   348 tokens


2 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     687.14 ms /   297 tokens (    2.31 ms per token,   432.22 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     689.54 ms /   298 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     599.38 ms /   280 tokens (    2.14 ms per token,   467.15 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     601.32 ms /   281 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     703.13 ms /   303 tokens (    2.32 ms per token,   430.93 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     705.12 ms /   304 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     468.12 ms /   213 tokens (    2.20 ms per token,   455.02 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     470.19 ms /   214 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     410.94 ms /   192 tokens (    2.14 ms per token,   467.22 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     413.45 ms /   193 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     669.94 ms /   299 tokens (    2.24 ms per token,   446.31 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     672.83 ms /   300 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     675.88 ms /   297 tokens (    2.28 ms per token,   439.43 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     677.98 ms /   298 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     724.75 ms /   305 tokens (    2.38 ms per token,   420.83 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     727.35 ms /   306 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     486.21 ms /   223 tokens (    2.18 ms per token,   458.65 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     488.10 ms /   224 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     475.07 ms /   216 tokens (    2.20 ms per token,   454.67 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     477.43 ms /   217 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     699.90 ms /   299 tokens (    2.34 ms per token,   427.20 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     702.58 ms /   300 tokens


2 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =    1002.27 ms /   419 tokens (    2.39 ms per token,   418.05 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =    1004.76 ms /   420 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     565.80 ms /   263 tokens (    2.15 ms per token,   464.83 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     568.64 ms /   264 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     730.80 ms /   301 tokens (    2.43 ms per token,   411.88 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     732.99 ms /   302 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     414.79 ms /   196 tokens (    2.12 ms per token,   472.53 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     417.55 ms /   197 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     636.49 ms /   283 tokens (    2.25 ms per token,   444.62 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     639.24 ms /   284 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     409.02 ms /   192 tokens (    2.13 ms per token,   469.42 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     410.91 ms /   193 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     724.72 ms /   315 tokens (    2.30 ms per token,   434.65 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     727.44 ms /   316 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     627.41 ms /   282 tokens (    2.22 ms per token,   449.46 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     629.95 ms /   283 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     466.80 ms /   220 tokens (    2.12 ms per token,   471.29 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     469.55 ms /   221 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     742.45 ms /   316 tokens (    2.35 ms per token,   425.62 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     745.41 ms /   317 tokens


6 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     549.89 ms /   243 tokens (    2.26 ms per token,   441.90 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     552.12 ms /   244 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     490.73 ms /   240 tokens (    2.04 ms per token,   489.06 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     492.73 ms /   241 tokens


2 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     522.04 ms /   226 tokens (    2.31 ms per token,   432.92 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     524.70 ms /   227 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     540.54 ms /   256 tokens (    2.11 ms per token,   473.60 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     543.00 ms /   257 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     485.25 ms /   222 tokens (    2.19 ms per token,   457.50 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     487.97 ms /   223 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     582.35 ms /   264 tokens (    2.21 ms per token,   453.33 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     585.10 ms /   265 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     577.57 ms /   265 tokens (    2.18 ms per token,   458.82 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     579.81 ms /   266 tokens


2 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     497.60 ms /   230 tokens (    2.16 ms per token,   462.22 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     500.24 ms /   231 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     427.52 ms /   186 tokens (    2.30 ms per token,   435.07 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     430.08 ms /   187 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     312.93 ms /   150 tokens (    2.09 ms per token,   479.35 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     314.92 ms /   151 tokens


2 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     594.72 ms /   266 tokens (    2.24 ms per token,   447.27 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     597.57 ms /   267 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     685.63 ms /   299 tokens (    2.29 ms per token,   436.09 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     688.13 ms /   300 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     417.76 ms /   183 tokens (    2.28 ms per token,   438.05 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     419.62 ms /   184 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     639.43 ms /   285 tokens (    2.24 ms per token,   445.71 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     642.22 ms /   286 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     516.62 ms /   232 tokens (    2.23 ms per token,   449.07 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     518.99 ms /   233 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     728.12 ms /   327 tokens (    2.23 ms per token,   449.10 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     730.20 ms /   328 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     510.49 ms /   232 tokens (    2.20 ms per token,   454.47 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     512.80 ms /   233 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     592.70 ms /   264 tokens (    2.25 ms per token,   445.42 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     595.63 ms /   265 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     738.67 ms /   316 tokens (    2.34 ms per token,   427.80 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     740.91 ms /   317 tokens


5 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     438.16 ms /   206 tokens (    2.13 ms per token,   470.14 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     440.03 ms /   207 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     656.95 ms /   289 tokens (    2.27 ms per token,   439.91 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     658.96 ms /   290 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     392.28 ms /   178 tokens (    2.20 ms per token,   453.75 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     393.99 ms /   179 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     944.56 ms /   410 tokens (    2.30 ms per token,   434.06 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     947.11 ms /   411 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     541.07 ms /   233 tokens (    2.32 ms per token,   430.63 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     543.61 ms /   234 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     717.47 ms /   308 tokens (    2.33 ms per token,   429.29 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     720.48 ms /   309 tokens


1 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     601.87 ms /   266 tokens (    2.26 ms per token,   441.96 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     604.33 ms /   267 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     910.17 ms /   390 tokens (    2.33 ms per token,   428.49 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     912.40 ms /   391 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     688.37 ms /   298 tokens (    2.31 ms per token,   432.91 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     691.01 ms /   299 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     725.34 ms /   326 tokens (    2.22 ms per token,   449.45 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     727.50 ms /   327 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     550.78 ms /   237 tokens (    2.32 ms per token,   430.30 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     553.08 ms /   238 tokens


2 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     772.21 ms /   337 tokens (    2.29 ms per token,   436.41 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     774.43 ms /   338 tokens


2 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     527.04 ms /   226 tokens (    2.33 ms per token,   428.81 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     529.14 ms /   227 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =    1009.56 ms /   388 tokens (    2.60 ms per token,   384.33 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =    1012.75 ms /   389 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     551.04 ms /   246 tokens (    2.24 ms per token,   446.43 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     553.12 ms /   247 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     542.09 ms /   212 tokens (    2.56 ms per token,   391.08 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     544.62 ms /   213 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     596.66 ms /   270 tokens (    2.21 ms per token,   452.52 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     599.20 ms /   271 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     458.50 ms /   213 tokens (    2.15 ms per token,   464.55 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     460.84 ms /   214 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     429.95 ms /   204 tokens (    2.11 ms per token,   474.47 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     432.72 ms /   205 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     528.49 ms /   239 tokens (    2.21 ms per token,   452.23 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     530.55 ms /   240 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     472.76 ms /   214 tokens (    2.21 ms per token,   452.66 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     475.40 ms /   215 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     642.42 ms /   284 tokens (    2.26 ms per token,   442.08 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     644.82 ms /   285 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     793.31 ms /   350 tokens (    2.27 ms per token,   441.19 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     795.56 ms /   351 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     558.12 ms /   243 tokens (    2.30 ms per token,   435.39 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     560.43 ms /   244 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     241.58 ms /   109 tokens (    2.22 ms per token,   451.19 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     243.88 ms /   110 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     452.17 ms /   191 tokens (    2.37 ms per token,   422.41 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     454.77 ms /   192 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     787.23 ms /   350 tokens (    2.25 ms per token,   444.60 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     790.19 ms /   351 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     531.88 ms /   233 tokens (    2.28 ms per token,   438.07 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     534.28 ms /   234 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     553.36 ms /   257 tokens (    2.15 ms per token,   464.43 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     555.74 ms /   258 tokens


2 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     776.89 ms /   352 tokens (    2.21 ms per token,   453.09 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     779.84 ms /   353 tokens


6 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     929.70 ms /   399 tokens (    2.33 ms per token,   429.17 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     932.63 ms /   400 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     354.64 ms /   165 tokens (    2.15 ms per token,   465.26 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     357.24 ms /   166 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     946.73 ms /   403 tokens (    2.35 ms per token,   425.68 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     949.17 ms /   404 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     536.65 ms /   241 tokens (    2.23 ms per token,   449.08 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     538.57 ms /   242 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     493.42 ms /   240 tokens (    2.06 ms per token,   486.40 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     495.47 ms /   241 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     767.03 ms /   337 tokens (    2.28 ms per token,   439.36 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     769.52 ms /   338 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     731.44 ms /   308 tokens (    2.37 ms per token,   421.09 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     733.95 ms /   309 tokens


2 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     622.48 ms /   282 tokens (    2.21 ms per token,   453.02 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     625.05 ms /   283 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     553.71 ms /   243 tokens (    2.28 ms per token,   438.86 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     555.74 ms /   244 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     585.55 ms /   253 tokens (    2.31 ms per token,   432.07 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     587.60 ms /   254 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     592.33 ms /   267 tokens (    2.22 ms per token,   450.76 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     595.18 ms /   268 tokens


2 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     442.81 ms /   209 tokens (    2.12 ms per token,   471.98 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     444.84 ms /   210 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     850.73 ms /   314 tokens (    2.71 ms per token,   369.10 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     852.96 ms /   315 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =    1036.56 ms /   433 tokens (    2.39 ms per token,   417.73 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =    1039.37 ms /   434 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     580.88 ms /   269 tokens (    2.16 ms per token,   463.09 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     582.86 ms /   270 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     545.01 ms /   239 tokens (    2.28 ms per token,   438.52 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     547.17 ms /   240 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     567.43 ms /   261 tokens (    2.17 ms per token,   459.97 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     570.19 ms /   262 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     501.20 ms /   227 tokens (    2.21 ms per token,   452.91 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     503.83 ms /   228 tokens


6 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     440.99 ms /   201 tokens (    2.19 ms per token,   455.80 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     443.05 ms /   202 tokens


5 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =    1001.88 ms /   423 tokens (    2.37 ms per token,   422.21 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =    1004.31 ms /   424 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     472.90 ms /   224 tokens (    2.11 ms per token,   473.68 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     475.58 ms /   225 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     741.86 ms /   313 tokens (    2.37 ms per token,   421.91 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     744.27 ms /   314 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     651.33 ms /   283 tokens (    2.30 ms per token,   434.50 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     653.85 ms /   284 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     555.77 ms /   237 tokens (    2.35 ms per token,   426.43 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     558.32 ms /   238 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     486.00 ms /   209 tokens (    2.33 ms per token,   430.05 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     488.38 ms /   210 tokens


1 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     405.11 ms /   185 tokens (    2.19 ms per token,   456.67 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     406.55 ms /   186 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     448.29 ms /   199 tokens (    2.25 ms per token,   443.91 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     449.87 ms /   200 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     575.32 ms /   266 tokens (    2.16 ms per token,   462.35 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     576.95 ms /   267 tokens


1 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     723.64 ms /   324 tokens (    2.23 ms per token,   447.74 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     725.40 ms /   325 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     609.96 ms /   266 tokens (    2.29 ms per token,   436.09 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     611.60 ms /   267 tokens


2 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     444.04 ms /   209 tokens (    2.12 ms per token,   470.68 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     445.58 ms /   210 tokens


5 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     596.12 ms /   274 tokens (    2.18 ms per token,   459.64 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     598.43 ms /   275 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     488.86 ms /   219 tokens (    2.23 ms per token,   447.98 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     491.05 ms /   220 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     581.30 ms /   270 tokens (    2.15 ms per token,   464.47 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     582.89 ms /   271 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     695.39 ms /   301 tokens (    2.31 ms per token,   432.85 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     697.29 ms /   302 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     724.80 ms /   306 tokens (    2.37 ms per token,   422.19 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     726.74 ms /   307 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =    1252.81 ms /   503 tokens (    2.49 ms per token,   401.50 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =    1255.07 ms /   504 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     567.09 ms /   249 tokens (    2.28 ms per token,   439.08 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     568.96 ms /   250 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     711.31 ms /   307 tokens (    2.32 ms per token,   431.60 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     713.43 ms /   308 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     293.95 ms /   139 tokens (    2.11 ms per token,   472.87 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     295.89 ms /   140 tokens


9 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     337.43 ms /   154 tokens (    2.19 ms per token,   456.39 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     339.35 ms /   155 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     661.37 ms /   291 tokens (    2.27 ms per token,   440.00 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     663.39 ms /   292 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     677.00 ms /   300 tokens (    2.26 ms per token,   443.13 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     680.04 ms /   301 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     528.68 ms /   238 tokens (    2.22 ms per token,   450.18 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     530.81 ms /   239 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     478.10 ms /   218 tokens (    2.19 ms per token,   455.97 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     480.29 ms /   219 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     561.64 ms /   245 tokens (    2.29 ms per token,   436.22 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     563.96 ms /   246 tokens


2 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     516.26 ms /   231 tokens (    2.23 ms per token,   447.45 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     518.30 ms /   232 tokens


2 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     510.30 ms /   231 tokens (    2.21 ms per token,   452.67 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     513.09 ms /   232 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     577.37 ms /   265 tokens (    2.18 ms per token,   458.98 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     579.77 ms /   266 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     890.38 ms /   388 tokens (    2.29 ms per token,   435.77 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     893.39 ms /   389 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     643.43 ms /   286 tokens (    2.25 ms per token,   444.49 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     645.80 ms /   287 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     415.51 ms /   181 tokens (    2.30 ms per token,   435.60 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     417.39 ms /   182 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     445.59 ms /   206 tokens (    2.16 ms per token,   462.31 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     447.91 ms /   207 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     330.52 ms /   152 tokens (    2.17 ms per token,   459.88 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     332.50 ms /   153 tokens


1 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     369.15 ms /   163 tokens (    2.26 ms per token,   441.56 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     371.00 ms /   164 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     616.63 ms /   278 tokens (    2.22 ms per token,   450.83 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     618.89 ms /   279 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     789.33 ms /   345 tokens (    2.29 ms per token,   437.08 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     792.25 ms /   346 tokens


6 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     328.21 ms /   160 tokens (    2.05 ms per token,   487.49 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     330.35 ms /   161 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     595.45 ms /   273 tokens (    2.18 ms per token,   458.48 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     597.44 ms /   274 tokens


8 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     542.74 ms /   227 tokens (    2.39 ms per token,   418.25 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     545.04 ms /   228 tokens


1 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     644.99 ms /   291 tokens (    2.22 ms per token,   451.17 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     647.30 ms /   292 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     515.63 ms /   240 tokens (    2.15 ms per token,   465.45 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     518.29 ms /   241 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     603.62 ms /   272 tokens (    2.22 ms per token,   450.62 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     605.83 ms /   273 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     291.35 ms /   133 tokens (    2.19 ms per token,   456.50 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     293.00 ms /   134 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     393.10 ms /   174 tokens (    2.26 ms per token,   442.64 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     394.94 ms /   175 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     374.62 ms /   175 tokens (    2.14 ms per token,   467.14 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     376.81 ms /   176 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     667.60 ms /   298 tokens (    2.24 ms per token,   446.37 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     670.29 ms /   299 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     503.23 ms /   223 tokens (    2.26 ms per token,   443.14 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     505.50 ms /   224 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =    1074.73 ms /   442 tokens (    2.43 ms per token,   411.26 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =    1077.29 ms /   443 tokens


5 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     943.45 ms /   402 tokens (    2.35 ms per token,   426.10 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     946.15 ms /   403 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     509.26 ms /   232 tokens (    2.20 ms per token,   455.56 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     511.24 ms /   233 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     474.22 ms /   218 tokens (    2.18 ms per token,   459.71 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     476.05 ms /   219 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     786.89 ms /   340 tokens (    2.31 ms per token,   432.08 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     789.65 ms /   341 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     338.10 ms /   157 tokens (    2.15 ms per token,   464.36 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     340.35 ms /   158 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     415.37 ms /   200 tokens (    2.08 ms per token,   481.49 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     417.39 ms /   201 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     555.90 ms /   250 tokens (    2.22 ms per token,   449.72 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     558.21 ms /   251 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     460.13 ms /   210 tokens (    2.19 ms per token,   456.39 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     462.55 ms /   211 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     876.78 ms /   366 tokens (    2.40 ms per token,   417.44 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     879.44 ms /   367 tokens


2 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     409.33 ms /   179 tokens (    2.29 ms per token,   437.30 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     411.26 ms /   180 tokens


5 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     559.62 ms /   242 tokens (    2.31 ms per token,   432.43 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     562.00 ms /   243 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     688.47 ms /   302 tokens (    2.28 ms per token,   438.66 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     690.89 ms /   303 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     618.34 ms /   279 tokens (    2.22 ms per token,   451.21 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     620.30 ms /   280 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     465.13 ms /   218 tokens (    2.13 ms per token,   468.69 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     467.00 ms /   219 tokens


2 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     521.01 ms /   227 tokens (    2.30 ms per token,   435.69 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     523.21 ms /   228 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     565.99 ms /   251 tokens (    2.25 ms per token,   443.47 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     568.17 ms /   252 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     839.43 ms /   352 tokens (    2.38 ms per token,   419.33 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     842.07 ms /   353 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     378.81 ms /   161 tokens (    2.35 ms per token,   425.01 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     381.44 ms /   162 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     372.23 ms /   175 tokens (    2.13 ms per token,   470.14 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     374.56 ms /   176 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     257.91 ms /   120 tokens (    2.15 ms per token,   465.28 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     260.45 ms /   121 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     570.32 ms /   263 tokens (    2.17 ms per token,   461.14 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     572.61 ms /   264 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     542.61 ms /   244 tokens (    2.22 ms per token,   449.68 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     545.05 ms /   245 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     271.87 ms /   104 tokens (    2.61 ms per token,   382.54 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     274.51 ms /   105 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     536.48 ms /   256 tokens (    2.10 ms per token,   477.19 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     538.56 ms /   257 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     775.35 ms /   345 tokens (    2.25 ms per token,   444.96 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     778.15 ms /   346 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     760.23 ms /   319 tokens (    2.38 ms per token,   419.61 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     762.59 ms /   320 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     569.94 ms /   270 tokens (    2.11 ms per token,   473.73 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     572.15 ms /   271 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     519.96 ms /   235 tokens (    2.21 ms per token,   451.96 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     521.96 ms /   236 tokens


1 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     644.60 ms /   285 tokens (    2.26 ms per token,   442.14 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     647.02 ms /   286 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     468.46 ms /   217 tokens (    2.16 ms per token,   463.22 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     471.20 ms /   218 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     564.46 ms /   259 tokens (    2.18 ms per token,   458.85 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     566.39 ms /   260 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     569.51 ms /   272 tokens (    2.09 ms per token,   477.60 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     572.10 ms /   273 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     680.17 ms /   293 tokens (    2.32 ms per token,   430.78 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     682.58 ms /   294 tokens


5 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     598.06 ms /   280 tokens (    2.14 ms per token,   468.18 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     600.31 ms /   281 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     469.97 ms /   215 tokens (    2.19 ms per token,   457.47 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     472.43 ms /   216 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     675.31 ms /   294 tokens (    2.30 ms per token,   435.36 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     677.75 ms /   295 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     555.00 ms /   262 tokens (    2.12 ms per token,   472.07 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     557.40 ms /   263 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     212.83 ms /    92 tokens (    2.31 ms per token,   432.27 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     215.36 ms /    93 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     396.38 ms /   180 tokens (    2.20 ms per token,   454.11 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     398.72 ms /   181 tokens


1 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     306.11 ms /   143 tokens (    2.14 ms per token,   467.15 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     308.62 ms /   144 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     629.16 ms /   280 tokens (    2.25 ms per token,   445.04 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     631.80 ms /   281 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     338.36 ms /   157 tokens (    2.16 ms per token,   464.01 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     340.60 ms /   158 tokens


2 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     562.86 ms /   245 tokens (    2.30 ms per token,   435.28 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     565.43 ms /   246 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     835.64 ms /   359 tokens (    2.33 ms per token,   429.61 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     838.56 ms /   360 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     613.52 ms /   285 tokens (    2.15 ms per token,   464.53 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     615.60 ms /   286 tokens


2 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     577.69 ms /   255 tokens (    2.27 ms per token,   441.41 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     580.07 ms /   256 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     315.92 ms /   148 tokens (    2.13 ms per token,   468.47 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     317.57 ms /   149 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     412.42 ms /   173 tokens (    2.38 ms per token,   419.48 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     414.66 ms /   174 tokens


5 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     425.70 ms /   205 tokens (    2.08 ms per token,   481.56 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     428.08 ms /   206 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     556.15 ms /   257 tokens (    2.16 ms per token,   462.11 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     558.50 ms /   258 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     436.13 ms /   210 tokens (    2.08 ms per token,   481.50 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     438.47 ms /   211 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     560.88 ms /   242 tokens (    2.32 ms per token,   431.47 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     562.81 ms /   243 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     808.04 ms /   360 tokens (    2.24 ms per token,   445.52 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     810.22 ms /   361 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =    1056.87 ms /   414 tokens (    2.55 ms per token,   391.72 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =    1059.13 ms /   415 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     410.83 ms /   185 tokens (    2.22 ms per token,   450.31 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     413.27 ms /   186 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     412.88 ms /   196 tokens (    2.11 ms per token,   474.71 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     415.16 ms /   197 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     854.22 ms /   367 tokens (    2.33 ms per token,   429.63 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     857.33 ms /   368 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     534.69 ms /   229 tokens (    2.33 ms per token,   428.29 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     536.76 ms /   230 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     401.82 ms /   183 tokens (    2.20 ms per token,   455.42 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     403.98 ms /   184 tokens


8 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     743.61 ms /   332 tokens (    2.24 ms per token,   446.47 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     746.34 ms /   333 tokens


2 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     316.73 ms /   145 tokens (    2.18 ms per token,   457.80 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     318.42 ms /   146 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     753.45 ms /   336 tokens (    2.24 ms per token,   445.95 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     755.70 ms /   337 tokens


2 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     331.97 ms /   151 tokens (    2.20 ms per token,   454.86 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     334.06 ms /   152 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     431.20 ms /   187 tokens (    2.31 ms per token,   433.67 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     433.31 ms /   188 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     773.33 ms /   321 tokens (    2.41 ms per token,   415.09 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     776.03 ms /   322 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     428.40 ms /   204 tokens (    2.10 ms per token,   476.19 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     430.70 ms /   205 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     724.50 ms /   315 tokens (    2.30 ms per token,   434.78 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     726.62 ms /   316 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     432.47 ms /   204 tokens (    2.12 ms per token,   471.71 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     434.31 ms /   205 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     403.11 ms /   172 tokens (    2.34 ms per token,   426.69 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     405.09 ms /   173 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     553.77 ms /   264 tokens (    2.10 ms per token,   476.73 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     555.62 ms /   265 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     397.92 ms /   175 tokens (    2.27 ms per token,   439.79 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     400.33 ms /   176 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     467.76 ms /   219 tokens (    2.14 ms per token,   468.19 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     469.70 ms /   220 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     695.72 ms /   292 tokens (    2.38 ms per token,   419.71 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     698.65 ms /   293 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     657.32 ms /   292 tokens (    2.25 ms per token,   444.23 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     660.27 ms /   293 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     550.22 ms /   250 tokens (    2.20 ms per token,   454.36 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     552.75 ms /   251 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     365.18 ms /   164 tokens (    2.23 ms per token,   449.09 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     367.09 ms /   165 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     741.31 ms /   307 tokens (    2.41 ms per token,   414.13 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     743.62 ms /   308 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     474.23 ms /   216 tokens (    2.20 ms per token,   455.47 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     476.58 ms /   217 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     503.64 ms /   231 tokens (    2.18 ms per token,   458.66 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     506.15 ms /   232 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     417.21 ms /   179 tokens (    2.33 ms per token,   429.04 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     419.91 ms /   180 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     658.01 ms /   293 tokens (    2.25 ms per token,   445.28 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     660.36 ms /   294 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     466.58 ms /   211 tokens (    2.21 ms per token,   452.23 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     468.93 ms /   212 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     329.33 ms /   151 tokens (    2.18 ms per token,   458.51 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     331.59 ms /   152 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     445.91 ms /   201 tokens (    2.22 ms per token,   450.77 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     447.72 ms /   202 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     566.72 ms /   265 tokens (    2.14 ms per token,   467.60 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     569.33 ms /   266 tokens


5 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     557.24 ms /   248 tokens (    2.25 ms per token,   445.05 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     559.15 ms /   249 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     609.26 ms /   278 tokens (    2.19 ms per token,   456.29 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     611.41 ms /   279 tokens


2 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     732.55 ms /   311 tokens (    2.36 ms per token,   424.55 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     735.63 ms /   312 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     663.10 ms /   295 tokens (    2.25 ms per token,   444.88 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     665.43 ms /   296 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     579.80 ms /   255 tokens (    2.27 ms per token,   439.80 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     582.67 ms /   256 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     585.85 ms /   269 tokens (    2.18 ms per token,   459.17 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     588.76 ms /   270 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     558.48 ms /   259 tokens (    2.16 ms per token,   463.76 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     560.95 ms /   260 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     990.21 ms /   409 tokens (    2.42 ms per token,   413.04 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     992.95 ms /   410 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     703.98 ms /   305 tokens (    2.31 ms per token,   433.25 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     706.01 ms /   306 tokens


1 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     559.25 ms /   248 tokens (    2.26 ms per token,   443.45 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     561.20 ms /   249 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     865.69 ms /   327 tokens (    2.65 ms per token,   377.73 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     868.30 ms /   328 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     901.13 ms /   380 tokens (    2.37 ms per token,   421.69 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     903.86 ms /   381 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     402.44 ms /   194 tokens (    2.07 ms per token,   482.06 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     404.93 ms /   195 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     622.07 ms /   276 tokens (    2.25 ms per token,   443.68 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     624.83 ms /   277 tokens


2 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     375.94 ms /   167 tokens (    2.25 ms per token,   444.22 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     378.41 ms /   168 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     696.84 ms /   305 tokens (    2.28 ms per token,   437.69 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     699.30 ms /   306 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     893.64 ms /   389 tokens (    2.30 ms per token,   435.30 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     896.68 ms /   390 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     560.71 ms /   259 tokens (    2.16 ms per token,   461.91 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     563.23 ms /   260 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     714.21 ms /   321 tokens (    2.22 ms per token,   449.45 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     716.71 ms /   322 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     212.39 ms /    96 tokens (    2.21 ms per token,   451.99 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     214.62 ms /    97 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     785.16 ms /   345 tokens (    2.28 ms per token,   439.40 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     788.22 ms /   346 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     730.27 ms /   328 tokens (    2.23 ms per token,   449.15 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     733.32 ms /   329 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     547.58 ms /   250 tokens (    2.19 ms per token,   456.56 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     550.20 ms /   251 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     472.33 ms /   206 tokens (    2.29 ms per token,   436.14 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     475.67 ms /   207 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     631.16 ms /   279 tokens (    2.26 ms per token,   442.04 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     633.15 ms /   280 tokens


6 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     740.10 ms /   318 tokens (    2.33 ms per token,   429.67 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     742.31 ms /   319 tokens


1 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     604.26 ms /   253 tokens (    2.39 ms per token,   418.69 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     606.30 ms /   254 tokens


2 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     760.68 ms /   338 tokens (    2.25 ms per token,   444.34 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     763.45 ms /   339 tokens


6 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     412.83 ms /   198 tokens (    2.08 ms per token,   479.62 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     414.84 ms /   199 tokens


1 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     752.52 ms /   312 tokens (    2.41 ms per token,   414.61 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     755.14 ms /   313 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     482.53 ms /   222 tokens (    2.17 ms per token,   460.08 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     484.91 ms /   223 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     448.87 ms /   208 tokens (    2.16 ms per token,   463.38 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     451.51 ms /   209 tokens


1 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     613.43 ms /   288 tokens (    2.13 ms per token,   469.49 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     615.66 ms /   289 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     405.05 ms /   177 tokens (    2.29 ms per token,   436.98 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     407.39 ms /   178 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     672.31 ms /   252 tokens (    2.67 ms per token,   374.83 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     675.22 ms /   253 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     606.95 ms /   275 tokens (    2.21 ms per token,   453.09 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     609.08 ms /   276 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     558.46 ms /   257 tokens (    2.17 ms per token,   460.19 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     561.31 ms /   258 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     570.41 ms /   262 tokens (    2.18 ms per token,   459.32 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     572.90 ms /   263 tokens


2 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     673.62 ms /   300 tokens (    2.25 ms per token,   445.35 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     675.66 ms /   301 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     494.18 ms /   217 tokens (    2.28 ms per token,   439.11 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     496.48 ms /   218 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     627.77 ms /   281 tokens (    2.23 ms per token,   447.61 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     630.65 ms /   282 tokens


1 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     717.11 ms /   322 tokens (    2.23 ms per token,   449.02 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     719.75 ms /   323 tokens


1 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     511.61 ms /   232 tokens (    2.21 ms per token,   453.47 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     514.47 ms /   233 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     479.12 ms /   220 tokens (    2.18 ms per token,   459.17 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     481.28 ms /   221 tokens


2 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     372.20 ms /   171 tokens (    2.18 ms per token,   459.43 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     374.69 ms /   172 tokens


6 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     491.60 ms /   221 tokens (    2.22 ms per token,   449.56 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     493.90 ms /   222 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     443.84 ms /   209 tokens (    2.12 ms per token,   470.89 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     446.63 ms /   210 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     463.33 ms /   207 tokens (    2.24 ms per token,   446.77 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     465.41 ms /   208 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     775.03 ms /   319 tokens (    2.43 ms per token,   411.60 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     777.54 ms /   320 tokens


2 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     545.56 ms /   258 tokens (    2.11 ms per token,   472.91 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     547.62 ms /   259 tokens


5 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     756.90 ms /   340 tokens (    2.23 ms per token,   449.20 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     759.83 ms /   341 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     745.85 ms /   329 tokens (    2.27 ms per token,   441.11 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     748.65 ms /   330 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     608.90 ms /   280 tokens (    2.17 ms per token,   459.85 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     611.74 ms /   281 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     580.36 ms /   270 tokens (    2.15 ms per token,   465.23 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     582.84 ms /   271 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     716.24 ms /   308 tokens (    2.33 ms per token,   430.02 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     718.68 ms /   309 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     398.09 ms /   185 tokens (    2.15 ms per token,   464.72 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     400.42 ms /   186 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     816.35 ms /   349 tokens (    2.34 ms per token,   427.51 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     818.59 ms /   350 tokens


1 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     594.59 ms /   270 tokens (    2.20 ms per token,   454.10 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     597.27 ms /   271 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     537.63 ms /   242 tokens (    2.22 ms per token,   450.12 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     539.88 ms /   243 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =    1031.57 ms /   426 tokens (    2.42 ms per token,   412.96 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =    1034.00 ms /   427 tokens


2 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     584.21 ms /   272 tokens (    2.15 ms per token,   465.59 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     587.22 ms /   273 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     699.36 ms /   258 tokens (    2.71 ms per token,   368.91 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     701.99 ms /   259 tokens


2 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     551.41 ms /   260 tokens (    2.12 ms per token,   471.52 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     553.74 ms /   261 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     639.14 ms /   285 tokens (    2.24 ms per token,   445.91 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     641.17 ms /   286 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     735.00 ms /   331 tokens (    2.22 ms per token,   450.34 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     737.12 ms /   332 tokens


8 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     606.39 ms /   280 tokens (    2.17 ms per token,   461.75 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     609.10 ms /   281 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     468.31 ms /   204 tokens (    2.30 ms per token,   435.61 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     470.57 ms /   205 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     921.37 ms /   402 tokens (    2.29 ms per token,   436.31 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     924.22 ms /   403 tokens


6 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     576.18 ms /   268 tokens (    2.15 ms per token,   465.13 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     578.87 ms /   269 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     322.87 ms /   143 tokens (    2.26 ms per token,   442.90 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     325.61 ms /   144 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     641.89 ms /   289 tokens (    2.22 ms per token,   450.23 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     643.95 ms /   290 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     754.68 ms /   331 tokens (    2.28 ms per token,   438.60 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     757.15 ms /   332 tokens


1 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     771.20 ms /   339 tokens (    2.27 ms per token,   439.57 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     773.48 ms /   340 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     587.99 ms /   271 tokens (    2.17 ms per token,   460.89 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     590.18 ms /   272 tokens


2 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     565.11 ms /   265 tokens (    2.13 ms per token,   468.93 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     567.35 ms /   266 tokens


2 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     619.53 ms /   277 tokens (    2.24 ms per token,   447.12 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     622.33 ms /   278 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     667.37 ms /   304 tokens (    2.20 ms per token,   455.52 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     669.51 ms /   305 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     562.82 ms /   257 tokens (    2.19 ms per token,   456.63 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     565.60 ms /   258 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     319.36 ms /   147 tokens (    2.17 ms per token,   460.29 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     321.46 ms /   148 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =    1124.69 ms /   447 tokens (    2.52 ms per token,   397.44 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =    1127.06 ms /   448 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     441.12 ms /   202 tokens (    2.18 ms per token,   457.93 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     443.63 ms /   203 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     600.44 ms /   275 tokens (    2.18 ms per token,   458.00 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     603.35 ms /   276 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     753.49 ms /   335 tokens (    2.25 ms per token,   444.60 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     755.87 ms /   336 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     546.19 ms /   244 tokens (    2.24 ms per token,   446.73 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     549.04 ms /   245 tokens


2 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     432.65 ms /   204 tokens (    2.12 ms per token,   471.51 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     434.86 ms /   205 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     617.11 ms /   268 tokens (    2.30 ms per token,   434.28 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     619.78 ms /   269 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     266.86 ms /   116 tokens (    2.30 ms per token,   434.68 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     269.31 ms /   117 tokens


1 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     409.40 ms /   200 tokens (    2.05 ms per token,   488.52 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     411.84 ms /   201 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =    1023.72 ms /   422 tokens (    2.43 ms per token,   412.22 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =    1026.43 ms /   423 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     726.25 ms /   313 tokens (    2.32 ms per token,   430.98 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     729.04 ms /   314 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     676.76 ms /   297 tokens (    2.28 ms per token,   438.86 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     679.34 ms /   298 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     529.56 ms /   228 tokens (    2.32 ms per token,   430.55 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     532.23 ms /   229 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     652.17 ms /   287 tokens (    2.27 ms per token,   440.07 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     654.36 ms /   288 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     359.13 ms /   158 tokens (    2.27 ms per token,   439.95 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     361.26 ms /   159 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     425.52 ms /   187 tokens (    2.28 ms per token,   439.46 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     427.60 ms /   188 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     666.15 ms /   291 tokens (    2.29 ms per token,   436.84 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     668.79 ms /   292 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =    1063.03 ms /   438 tokens (    2.43 ms per token,   412.03 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =    1066.02 ms /   439 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     498.64 ms /   229 tokens (    2.18 ms per token,   459.25 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     501.51 ms /   230 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     602.25 ms /   271 tokens (    2.22 ms per token,   449.98 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     605.12 ms /   272 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     379.85 ms /   172 tokens (    2.21 ms per token,   452.82 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     382.28 ms /   173 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     433.86 ms /   189 tokens (    2.30 ms per token,   435.63 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     436.27 ms /   190 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     484.40 ms /   222 tokens (    2.18 ms per token,   458.30 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     487.25 ms /   223 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     298.36 ms /   134 tokens (    2.23 ms per token,   449.12 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     300.64 ms /   135 tokens


1 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     591.00 ms /   269 tokens (    2.20 ms per token,   455.16 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     593.96 ms /   270 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     585.30 ms /   263 tokens (    2.23 ms per token,   449.34 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     587.51 ms /   264 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     369.21 ms /   169 tokens (    2.18 ms per token,   457.73 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     372.02 ms /   170 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     593.55 ms /   253 tokens (    2.35 ms per token,   426.25 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     595.72 ms /   254 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     857.34 ms /   384 tokens (    2.23 ms per token,   447.90 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     859.75 ms /   385 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     722.45 ms /   326 tokens (    2.22 ms per token,   451.24 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     725.54 ms /   327 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     689.81 ms /   295 tokens (    2.34 ms per token,   427.66 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     692.76 ms /   296 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     357.56 ms /   159 tokens (    2.25 ms per token,   444.68 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     359.89 ms /   160 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     745.14 ms /   333 tokens (    2.24 ms per token,   446.90 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     748.06 ms /   334 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     625.65 ms /   278 tokens (    2.25 ms per token,   444.34 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     628.62 ms /   279 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     742.55 ms /   336 tokens (    2.21 ms per token,   452.50 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     745.71 ms /   337 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     423.64 ms /   187 tokens (    2.27 ms per token,   441.41 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     426.55 ms /   188 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     753.72 ms /   336 tokens (    2.24 ms per token,   445.79 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     756.53 ms /   337 tokens


1 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     748.04 ms /   316 tokens (    2.37 ms per token,   422.43 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     750.37 ms /   317 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     749.89 ms /   338 tokens (    2.22 ms per token,   450.73 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     753.02 ms /   339 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     485.86 ms /   211 tokens (    2.30 ms per token,   434.28 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     487.80 ms /   212 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     889.56 ms /   373 tokens (    2.38 ms per token,   419.31 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     892.00 ms /   374 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     535.47 ms /   245 tokens (    2.19 ms per token,   457.55 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     537.56 ms /   246 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     501.92 ms /   222 tokens (    2.26 ms per token,   442.30 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     504.47 ms /   223 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     937.97 ms /   404 tokens (    2.32 ms per token,   430.72 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     940.56 ms /   405 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     537.38 ms /   239 tokens (    2.25 ms per token,   444.75 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     539.45 ms /   240 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     466.01 ms /   209 tokens (    2.23 ms per token,   448.49 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     467.99 ms /   210 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     429.03 ms /   196 tokens (    2.19 ms per token,   456.84 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     430.90 ms /   197 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     652.46 ms /   295 tokens (    2.21 ms per token,   452.13 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     654.86 ms /   296 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     505.64 ms /   231 tokens (    2.19 ms per token,   456.85 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     508.15 ms /   232 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     718.01 ms /   307 tokens (    2.34 ms per token,   427.57 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     720.49 ms /   308 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     686.90 ms /   297 tokens (    2.31 ms per token,   432.38 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     689.28 ms /   298 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     414.15 ms /   200 tokens (    2.07 ms per token,   482.91 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     416.40 ms /   201 tokens


1 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     492.53 ms /   193 tokens (    2.55 ms per token,   391.85 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     495.37 ms /   194 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     269.85 ms /   119 tokens (    2.27 ms per token,   440.99 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     271.94 ms /   120 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     772.19 ms /   343 tokens (    2.25 ms per token,   444.19 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     774.34 ms /   344 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     539.50 ms /   256 tokens (    2.11 ms per token,   474.51 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     542.06 ms /   257 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     667.65 ms /   304 tokens (    2.20 ms per token,   455.33 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     669.68 ms /   305 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     875.05 ms /   366 tokens (    2.39 ms per token,   418.26 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     878.24 ms /   367 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     901.45 ms /   392 tokens (    2.30 ms per token,   434.85 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     904.08 ms /   393 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     641.43 ms /   287 tokens (    2.23 ms per token,   447.44 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     644.14 ms /   288 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     534.15 ms /   241 tokens (    2.22 ms per token,   451.18 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     536.75 ms /   242 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     736.50 ms /   322 tokens (    2.29 ms per token,   437.21 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     738.63 ms /   323 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     368.47 ms /   163 tokens (    2.26 ms per token,   442.38 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     371.19 ms /   164 tokens


1 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     780.88 ms /   342 tokens (    2.28 ms per token,   437.97 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     783.28 ms /   343 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     463.06 ms /   224 tokens (    2.07 ms per token,   483.74 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     465.91 ms /   225 tokens


1 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     510.88 ms /   228 tokens (    2.24 ms per token,   446.29 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     513.68 ms /   229 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     560.13 ms /   250 tokens (    2.24 ms per token,   446.33 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     562.80 ms /   251 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     716.30 ms /   315 tokens (    2.27 ms per token,   439.76 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     718.47 ms /   316 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     588.00 ms /   253 tokens (    2.32 ms per token,   430.27 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     590.79 ms /   254 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     622.45 ms /   276 tokens (    2.26 ms per token,   443.41 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     625.28 ms /   277 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     398.63 ms /   192 tokens (    2.08 ms per token,   481.65 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     401.37 ms /   193 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     579.25 ms /   270 tokens (    2.15 ms per token,   466.12 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     581.33 ms /   271 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     635.21 ms /   288 tokens (    2.21 ms per token,   453.39 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     637.46 ms /   289 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     458.12 ms /   207 tokens (    2.21 ms per token,   451.85 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     460.86 ms /   208 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     506.89 ms /   232 tokens (    2.18 ms per token,   457.69 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     508.84 ms /   233 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     599.04 ms /   243 tokens (    2.47 ms per token,   405.65 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     601.59 ms /   244 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     749.56 ms /   314 tokens (    2.39 ms per token,   418.91 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     752.14 ms /   315 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     659.01 ms /   294 tokens (    2.24 ms per token,   446.13 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     662.08 ms /   295 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =    1229.09 ms /   512 tokens (    2.40 ms per token,   416.57 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =    1232.61 ms /   513 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     529.12 ms /   238 tokens (    2.22 ms per token,   449.80 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     532.12 ms /   239 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     451.98 ms /   209 tokens (    2.16 ms per token,   462.41 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     454.49 ms /   210 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     415.76 ms /   182 tokens (    2.28 ms per token,   437.75 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     417.84 ms /   183 tokens


2 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     542.50 ms /   237 tokens (    2.29 ms per token,   436.86 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     544.81 ms /   238 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     575.52 ms /   253 tokens (    2.27 ms per token,   439.60 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     577.93 ms /   254 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     644.82 ms /   289 tokens (    2.23 ms per token,   448.18 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     647.41 ms /   290 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     659.33 ms /   286 tokens (    2.31 ms per token,   433.77 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     661.50 ms /   287 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     330.90 ms /   144 tokens (    2.30 ms per token,   435.17 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     332.63 ms /   145 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     497.67 ms /   230 tokens (    2.16 ms per token,   462.15 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     499.23 ms /   231 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     439.23 ms /   208 tokens (    2.11 ms per token,   473.55 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     440.19 ms /   209 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     434.17 ms /   190 tokens (    2.29 ms per token,   437.62 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     436.43 ms /   191 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     735.01 ms /   328 tokens (    2.24 ms per token,   446.25 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     737.91 ms /   329 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     395.35 ms /   178 tokens (    2.22 ms per token,   450.23 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     397.28 ms /   179 tokens


8 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     502.20 ms /   222 tokens (    2.26 ms per token,   442.05 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     504.63 ms /   223 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     794.05 ms /   349 tokens (    2.28 ms per token,   439.52 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     796.96 ms /   350 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     555.45 ms /   246 tokens (    2.26 ms per token,   442.88 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     557.73 ms /   247 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     751.11 ms /   331 tokens (    2.27 ms per token,   440.68 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     753.68 ms /   332 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     913.23 ms /   371 tokens (    2.46 ms per token,   406.25 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     915.70 ms /   372 tokens


5 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     604.49 ms /   274 tokens (    2.21 ms per token,   453.28 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     607.49 ms /   275 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     474.20 ms /   215 tokens (    2.21 ms per token,   453.39 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     476.37 ms /   216 tokens


2 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     460.32 ms /   212 tokens (    2.17 ms per token,   460.55 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     462.65 ms /   213 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     455.94 ms /   214 tokens (    2.13 ms per token,   469.35 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     458.11 ms /   215 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     886.55 ms /   366 tokens (    2.42 ms per token,   412.84 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     889.61 ms /   367 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     583.39 ms /   247 tokens (    2.36 ms per token,   423.39 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     585.69 ms /   248 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     876.32 ms /   366 tokens (    2.39 ms per token,   417.66 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     879.53 ms /   367 tokens


6 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     289.76 ms /   123 tokens (    2.36 ms per token,   424.48 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     292.53 ms /   124 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     555.99 ms /   242 tokens (    2.30 ms per token,   435.26 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     558.53 ms /   243 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     495.78 ms /   217 tokens (    2.28 ms per token,   437.70 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     497.83 ms /   218 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     895.77 ms /   374 tokens (    2.40 ms per token,   417.52 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     898.42 ms /   375 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     414.42 ms /   180 tokens (    2.30 ms per token,   434.35 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     416.89 ms /   181 tokens


5 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     575.04 ms /   194 tokens (    2.96 ms per token,   337.37 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     577.20 ms /   195 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     666.77 ms /   293 tokens (    2.28 ms per token,   439.43 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     669.73 ms /   294 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     592.01 ms /   248 tokens (    2.39 ms per token,   418.91 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     594.73 ms /   249 tokens


2 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     645.51 ms /   261 tokens (    2.47 ms per token,   404.33 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     647.80 ms /   262 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     713.79 ms /   308 tokens (    2.32 ms per token,   431.50 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     716.83 ms /   309 tokens


2 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     547.51 ms /   237 tokens (    2.31 ms per token,   432.87 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     550.19 ms /   238 tokens


2 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     505.30 ms /   211 tokens (    2.39 ms per token,   417.58 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     507.35 ms /   212 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     666.23 ms /   281 tokens (    2.37 ms per token,   421.78 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     668.92 ms /   282 tokens


6 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     368.02 ms /   164 tokens (    2.24 ms per token,   445.63 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     370.12 ms /   165 tokens


2 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     729.56 ms /   297 tokens (    2.46 ms per token,   407.09 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     732.01 ms /   298 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     737.19 ms /   330 tokens (    2.23 ms per token,   447.64 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     739.95 ms /   331 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     516.71 ms /   240 tokens (    2.15 ms per token,   464.48 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     518.87 ms /   241 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     583.60 ms /   246 tokens (    2.37 ms per token,   421.52 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     585.59 ms /   247 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     696.78 ms /   297 tokens (    2.35 ms per token,   426.25 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     699.04 ms /   298 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     593.39 ms /   254 tokens (    2.34 ms per token,   428.05 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     595.33 ms /   255 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     583.59 ms /   250 tokens (    2.33 ms per token,   428.38 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     585.23 ms /   251 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     729.23 ms /   311 tokens (    2.34 ms per token,   426.48 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     732.35 ms /   312 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     682.52 ms /   214 tokens (    3.19 ms per token,   313.55 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     684.81 ms /   215 tokens


1 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     533.09 ms /   209 tokens (    2.55 ms per token,   392.06 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     536.42 ms /   210 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     640.62 ms /   256 tokens (    2.50 ms per token,   399.61 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     642.91 ms /   257 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     772.99 ms /   299 tokens (    2.59 ms per token,   386.81 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     775.79 ms /   300 tokens


5 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     828.74 ms /   318 tokens (    2.61 ms per token,   383.71 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     830.24 ms /   319 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     602.38 ms /   250 tokens (    2.41 ms per token,   415.02 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     603.88 ms /   251 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     414.34 ms /   176 tokens (    2.35 ms per token,   424.77 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     417.66 ms /   177 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     794.15 ms /   308 tokens (    2.58 ms per token,   387.83 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     795.78 ms /   309 tokens


2 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     504.05 ms /   211 tokens (    2.39 ms per token,   418.61 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     506.06 ms /   212 tokens


5 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     622.61 ms /   262 tokens (    2.38 ms per token,   420.81 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     624.72 ms /   263 tokens


2 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     782.02 ms /   323 tokens (    2.42 ms per token,   413.03 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     785.07 ms /   324 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     620.00 ms /   255 tokens (    2.43 ms per token,   411.29 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     621.91 ms /   256 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     591.58 ms /   256 tokens (    2.31 ms per token,   432.74 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     593.85 ms /   257 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     332.18 ms /   148 tokens (    2.24 ms per token,   445.54 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     335.37 ms /   149 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     757.56 ms /   309 tokens (    2.45 ms per token,   407.89 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     759.68 ms /   310 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     898.14 ms /   308 tokens (    2.92 ms per token,   342.93 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     899.81 ms /   309 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     861.68 ms /   312 tokens (    2.76 ms per token,   362.08 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     863.76 ms /   313 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     465.12 ms /   216 tokens (    2.15 ms per token,   464.40 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     467.56 ms /   217 tokens


2 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     571.97 ms /   247 tokens (    2.32 ms per token,   431.84 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     574.82 ms /   248 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     352.27 ms /   163 tokens (    2.16 ms per token,   462.72 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     354.10 ms /   164 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     639.62 ms /   281 tokens (    2.28 ms per token,   439.32 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     642.27 ms /   282 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     504.81 ms /   235 tokens (    2.15 ms per token,   465.52 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     507.22 ms /   236 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     610.48 ms /   235 tokens (    2.60 ms per token,   384.94 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     614.41 ms /   236 tokens


5 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     589.06 ms /   253 tokens (    2.33 ms per token,   429.50 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     591.72 ms /   254 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     743.24 ms /   319 tokens (    2.33 ms per token,   429.20 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     745.88 ms /   320 tokens


2 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     418.97 ms /   183 tokens (    2.29 ms per token,   436.78 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     421.74 ms /   184 tokens


5 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     581.57 ms /   263 tokens (    2.21 ms per token,   452.23 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     583.85 ms /   264 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     607.52 ms /   268 tokens (    2.27 ms per token,   441.13 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     610.17 ms /   269 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =    1196.18 ms /   512 tokens (    2.34 ms per token,   428.03 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =    1199.60 ms /   513 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     312.09 ms /   123 tokens (    2.54 ms per token,   394.11 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     314.60 ms /   124 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     569.64 ms /   243 tokens (    2.34 ms per token,   426.59 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     571.88 ms /   244 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     693.73 ms /   296 tokens (    2.34 ms per token,   426.68 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     696.37 ms /   297 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     506.16 ms /   235 tokens (    2.15 ms per token,   464.28 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     508.84 ms /   236 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     864.72 ms /   362 tokens (    2.39 ms per token,   418.63 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     867.44 ms /   363 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     483.88 ms /   217 tokens (    2.23 ms per token,   448.45 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     485.94 ms /   218 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     631.63 ms /   212 tokens (    2.98 ms per token,   335.64 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     633.93 ms /   213 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     901.41 ms /   390 tokens (    2.31 ms per token,   432.66 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     903.52 ms /   391 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     571.89 ms /   265 tokens (    2.16 ms per token,   463.38 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     574.74 ms /   266 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =    2442.27 ms /   348 tokens (    7.02 ms per token,   142.49 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =    2445.33 ms /   349 tokens


2 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     791.39 ms /   296 tokens (    2.67 ms per token,   374.03 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     794.16 ms /   297 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     870.25 ms /   327 tokens (    2.66 ms per token,   375.75 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     872.45 ms /   328 tokens


5 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     786.89 ms /   269 tokens (    2.93 ms per token,   341.85 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     789.18 ms /   270 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     690.87 ms /   269 tokens (    2.57 ms per token,   389.36 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     693.32 ms /   270 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =    1144.53 ms /   381 tokens (    3.00 ms per token,   332.89 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =    1146.95 ms /   382 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     562.65 ms /   259 tokens (    2.17 ms per token,   460.32 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     565.35 ms /   260 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     763.50 ms /   319 tokens (    2.39 ms per token,   417.82 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     766.02 ms /   320 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     753.85 ms /   313 tokens (    2.41 ms per token,   415.20 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     756.24 ms /   314 tokens


2 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     344.06 ms /   157 tokens (    2.19 ms per token,   456.32 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     345.89 ms /   158 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     413.99 ms /   184 tokens (    2.25 ms per token,   444.45 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     416.00 ms /   185 tokens


5 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     633.33 ms /   282 tokens (    2.25 ms per token,   445.26 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     636.09 ms /   283 tokens


5 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     437.69 ms /   199 tokens (    2.20 ms per token,   454.66 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     440.38 ms /   200 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     477.53 ms /   217 tokens (    2.20 ms per token,   454.42 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     479.50 ms /   218 tokens


5 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     888.25 ms /   388 tokens (    2.29 ms per token,   436.81 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     890.96 ms /   389 tokens


2 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     432.23 ms /   204 tokens (    2.12 ms per token,   471.98 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     434.39 ms /   205 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     761.74 ms /   316 tokens (    2.41 ms per token,   414.84 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     764.20 ms /   317 tokens


1 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     910.89 ms /   391 tokens (    2.33 ms per token,   429.25 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     913.38 ms /   392 tokens


2 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     710.80 ms /   305 tokens (    2.33 ms per token,   429.10 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     713.81 ms /   306 tokens


2 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     625.12 ms /   281 tokens (    2.22 ms per token,   449.51 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     627.25 ms /   282 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     731.97 ms /   311 tokens (    2.35 ms per token,   424.88 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     734.98 ms /   312 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     690.50 ms /   297 tokens (    2.32 ms per token,   430.12 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     692.76 ms /   298 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     694.07 ms /   305 tokens (    2.28 ms per token,   439.44 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     697.02 ms /   306 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     481.11 ms /   221 tokens (    2.18 ms per token,   459.35 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     483.93 ms /   222 tokens


2 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     457.14 ms /   210 tokens (    2.18 ms per token,   459.37 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     459.74 ms /   211 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     423.76 ms /   198 tokens (    2.14 ms per token,   467.25 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     426.72 ms /   199 tokens


6 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     274.61 ms /   117 tokens (    2.35 ms per token,   426.06 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     276.69 ms /   118 tokens


1 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     303.31 ms /   134 tokens (    2.26 ms per token,   441.79 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     305.34 ms /   135 tokens


1 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     731.56 ms /   331 tokens (    2.21 ms per token,   452.46 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     734.09 ms /   332 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     488.05 ms /   201 tokens (    2.43 ms per token,   411.84 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     490.43 ms /   202 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     581.88 ms /   266 tokens (    2.19 ms per token,   457.14 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     584.47 ms /   267 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     358.96 ms /   165 tokens (    2.18 ms per token,   459.66 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     361.31 ms /   166 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     592.30 ms /   271 tokens (    2.19 ms per token,   457.54 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     594.52 ms /   272 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     439.73 ms /   193 tokens (    2.28 ms per token,   438.91 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     441.87 ms /   194 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     376.13 ms /   172 tokens (    2.19 ms per token,   457.29 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     378.16 ms /   173 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     527.75 ms /   233 tokens (    2.27 ms per token,   441.49 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     530.69 ms /   234 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     945.92 ms /   331 tokens (    2.86 ms per token,   349.93 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     948.63 ms /   332 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     749.96 ms /   289 tokens (    2.60 ms per token,   385.35 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     752.38 ms /   290 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     685.72 ms /   288 tokens (    2.38 ms per token,   420.00 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     688.85 ms /   289 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     589.23 ms /   241 tokens (    2.44 ms per token,   409.01 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     591.66 ms /   242 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     683.61 ms /   261 tokens (    2.62 ms per token,   381.80 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     686.37 ms /   262 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     726.63 ms /   313 tokens (    2.32 ms per token,   430.76 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     729.58 ms /   314 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     711.57 ms /   284 tokens (    2.51 ms per token,   399.12 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     713.66 ms /   285 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =    1010.48 ms /   361 tokens (    2.80 ms per token,   357.25 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =    1012.41 ms /   362 tokens


6 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     603.77 ms /   258 tokens (    2.34 ms per token,   427.31 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     605.10 ms /   259 tokens


5 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     632.06 ms /   277 tokens (    2.28 ms per token,   438.25 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     634.15 ms /   278 tokens


5 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     649.94 ms /   290 tokens (    2.24 ms per token,   446.19 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     651.69 ms /   291 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     594.78 ms /   260 tokens (    2.29 ms per token,   437.14 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     596.51 ms /   261 tokens


5 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     590.74 ms /   269 tokens (    2.20 ms per token,   455.36 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     592.11 ms /   270 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     552.81 ms /   212 tokens (    2.61 ms per token,   383.50 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     554.13 ms /   213 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     481.19 ms /   210 tokens (    2.29 ms per token,   436.41 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     482.73 ms /   211 tokens


1 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     590.95 ms /   248 tokens (    2.38 ms per token,   419.66 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     592.41 ms /   249 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     370.22 ms /   154 tokens (    2.40 ms per token,   415.97 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     372.45 ms /   155 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     330.48 ms /   160 tokens (    2.07 ms per token,   484.15 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     332.82 ms /   161 tokens


7 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     665.15 ms /   295 tokens (    2.25 ms per token,   443.51 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     667.37 ms /   296 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     548.51 ms /   256 tokens (    2.14 ms per token,   466.72 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     550.66 ms /   257 tokens


0 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     433.20 ms /   197 tokens (    2.20 ms per token,   454.76 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     435.65 ms /   198 tokens


2 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     705.55 ms /   259 tokens (    2.72 ms per token,   367.09 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     708.27 ms /   260 tokens


5 / 14



llama_print_timings:        load time =      90.62 ms
llama_print_timings:      sample time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings: prompt eval time =     694.08 ms /   296 tokens (    2.34 ms per token,   426.46 tokens per second)
llama_print_timings:        eval time =       0.00 ms /     1 runs   (    0.00 ms per token,      inf tokens per second)
llama_print_timings:       total time =     696.52 ms /   297 tokens


7 / 14
