In [None]:
import numpy as np
from src.logprobs import collect_logprobs


In [6]:
# Temperature sweep: 10**e for e in (-2, -1.5, -1, -0.5, 0), followed by an
# extra setting of 2.
exponents = (-2, -1.5, -1, -0.5, 0)  # -> 0.01, ~0.032, 0.1, ~0.316, 1
temperatures = [10**exponent for exponent in exponents]
temperatures.append(2)

# Echo the sweep, numbered from 1, with three decimal places per value.
print("Temperature settings:")
for position, value in enumerate(temperatures, start=1):
    print(f"  {position}. {value:.3f}")


Temperature settings:
  1. 0.010
  2. 0.032
  3. 0.100
  4. 0.316
  5. 1.000
  6. 2.000


In [7]:
# Build one parameter dict per temperature; every run uses the same batch size.
model_params = []
for temp in temperatures:
    model_params.append({"batch_size": 32, "temperature": temp})

# Show the parameter sets (numbered from 1) before starting the run.
print(f"Running GPT-2 with {len(model_params)} different temperature settings...")
print("Model parameters:")
for index, params in enumerate(model_params, start=1):
    print(f"  {index}. {params}")


Running GPT-2 with 6 different temperature settings...
Model parameters:
  1. {'batch_size': 32, 'temperature': 0.01}
  2. {'batch_size': 32, 'temperature': 0.03162277660168379}
  3. {'batch_size': 32, 'temperature': 0.1}
  4. {'batch_size': 32, 'temperature': 0.31622776601683794}
  5. {'batch_size': 32, 'temperature': 1}
  6. {'batch_size': 32, 'temperature': 2}


In [8]:
# Run collect_logprobs over data/data.json with GPT-2, once per entry in
# model_params, and save the collected results to a single CSV file.
results_path = "data/temperature_logprobs.csv"

try:
    collect_logprobs(
        "data/data.json",
        models=[
            "openai-community/gpt2",
        ],
        model_params=model_params,
        model_provider="hf",
        # "combinations" runs each model with each parameter set.
        param_mapping_strategy="combinations",
        save_results=True,
        save_path=results_path,
        verbose=True,
    )
except Exception as e:
    # Keep the short summary line, but re-raise so the full traceback is shown
    # and "Run All" stops here instead of continuing past a failed run
    # (later cells would otherwise read a missing or stale results file).
    print(f"Error: {e}")
    raise
else:
    # Only reached when collect_logprobs returned without raising.
    print(f"\nCompleted successfully! Results saved to {results_path}")


Using combinations mapping: running each model with each parameter set and each model_kwargs set.


Processing models:   0%|          | 0/6 [00:00<?, ?it/s]


--- Processing Model: openai-community/gpt2 with provider: hf and params: {'batch_size': 32, 'temperature': 0.01} ---
Using HFInterface for openai-community/gpt2 with model_kwargs: {}
Initializing LLMInterface for model: openai-community/gpt2 with params: {'model_kwargs': {}, 'batch_size': 32, 'temperature': 0.01, 'verbose': True}
Initializing HFInterface for openai-community/gpt2
Using device: mps
Attempting to load model with identifier: 'openai-community/gpt2'
Model openai-community/gpt2 loaded successfully on mps.
Generated 9690 prompts for model openai-community/gpt2 with params {'batch_size': 32, 'temperature': 0.01}. Processing via HFInterface...
Using batch size: 32, temperature: 0.01 (from init params)
Preparing 9690 prompts for HF batching...
Sorting completed in 0.55 seconds.
Processing in 303 batches of size 32...


Processing batches: 100%|██████████| 303/303 [07:56<00:00,  1.57s/it]


Finished processing all batches for openai-community/gpt2.
Releasing HF model and tokenizer for openai-community/gpt2 from mps...
HF resources released.


Processing models:  17%|█▋        | 1/6 [07:59<39:57, 479.48s/it]

--- Finished processing Model: openai-community/gpt2 with params: {'batch_size': 32, 'temperature': 0.01} ---

--- Processing Model: openai-community/gpt2 with provider: hf and params: {'batch_size': 32, 'temperature': 0.03162277660168379} ---
Using HFInterface for openai-community/gpt2 with model_kwargs: {}
Initializing LLMInterface for model: openai-community/gpt2 with params: {'model_kwargs': {}, 'batch_size': 32, 'temperature': 0.03162277660168379, 'verbose': True}
Initializing HFInterface for openai-community/gpt2
Using device: mps
Attempting to load model with identifier: 'openai-community/gpt2'
Model openai-community/gpt2 loaded successfully on mps.
Generated 9690 prompts for model openai-community/gpt2 with params {'batch_size': 32, 'temperature': 0.03162277660168379}. Processing via HFInterface...
Using batch size: 32, temperature: 0.03162277660168379 (from init params)
Preparing 9690 prompts for HF batching...
Sorting completed in 0.60 seconds.
Processing in 303 batches of size 32...

Processing batches: 100%|██████████| 303/303 [23:46<00:00,  4.71s/it]


Finished processing all batches for openai-community/gpt2.
Releasing HF model and tokenizer for openai-community/gpt2 from mps...


Processing models:  33%|███▎      | 2/6 [31:50<1:09:16, 1039.09s/it]

HF resources released.
--- Finished processing Model: openai-community/gpt2 with params: {'batch_size': 32, 'temperature': 0.03162277660168379} ---

--- Processing Model: openai-community/gpt2 with provider: hf and params: {'batch_size': 32, 'temperature': 0.1} ---
Using HFInterface for openai-community/gpt2 with model_kwargs: {}
Initializing LLMInterface for model: openai-community/gpt2 with params: {'model_kwargs': {}, 'batch_size': 32, 'temperature': 0.1, 'verbose': True}
Initializing HFInterface for openai-community/gpt2
Using device: mps
Attempting to load model with identifier: 'openai-community/gpt2'
Model openai-community/gpt2 loaded successfully on mps.
Generated 9690 prompts for model openai-community/gpt2 with params {'batch_size': 32, 'temperature': 0.1}. Processing via HFInterface...
Using batch size: 32, temperature: 0.1 (from init params)
Preparing 9690 prompts for HF batching...
Sorting completed in 0.67 seconds.
Processing in 303 batches of size 32...


Processing batches: 100%|██████████| 303/303 [19:38<00:00,  3.89s/it]


Finished processing all batches for openai-community/gpt2.
Releasing HF model and tokenizer for openai-community/gpt2 from mps...


Processing models:  50%|█████     | 3/6 [51:35<55:17, 1105.88s/it]  

HF resources released.
--- Finished processing Model: openai-community/gpt2 with params: {'batch_size': 32, 'temperature': 0.1} ---

--- Processing Model: openai-community/gpt2 with provider: hf and params: {'batch_size': 32, 'temperature': 0.31622776601683794} ---
Using HFInterface for openai-community/gpt2 with model_kwargs: {}
Initializing LLMInterface for model: openai-community/gpt2 with params: {'model_kwargs': {}, 'batch_size': 32, 'temperature': 0.31622776601683794, 'verbose': True}
Initializing HFInterface for openai-community/gpt2
Using device: mps
Attempting to load model with identifier: 'openai-community/gpt2'
Model openai-community/gpt2 loaded successfully on mps.
Generated 9690 prompts for model openai-community/gpt2 with params {'batch_size': 32, 'temperature': 0.31622776601683794}. Processing via HFInterface...
Using batch size: 32, temperature: 0.31622776601683794 (from init params)
Preparing 9690 prompts for HF batching...
Sorting completed in 0.70 seconds.
Processing in 303 batches of size 32...

Processing batches: 100%|██████████| 303/303 [14:22<00:00,  2.85s/it]


Finished processing all batches for openai-community/gpt2.
Releasing HF model and tokenizer for openai-community/gpt2 from mps...


Processing models:  67%|██████▋   | 4/6 [1:06:01<33:42, 1011.25s/it]

HF resources released.
--- Finished processing Model: openai-community/gpt2 with params: {'batch_size': 32, 'temperature': 0.31622776601683794} ---

--- Processing Model: openai-community/gpt2 with provider: hf and params: {'batch_size': 32, 'temperature': 1} ---
Using HFInterface for openai-community/gpt2 with model_kwargs: {}
Initializing LLMInterface for model: openai-community/gpt2 with params: {'model_kwargs': {}, 'batch_size': 32, 'temperature': 1, 'verbose': True}
Initializing HFInterface for openai-community/gpt2
Using device: mps
Attempting to load model with identifier: 'openai-community/gpt2'
Model openai-community/gpt2 loaded successfully on mps.
Generated 9690 prompts for model openai-community/gpt2 with params {'batch_size': 32, 'temperature': 1}. Processing via HFInterface...
Using batch size: 32, temperature: 1 (from init params)
Preparing 9690 prompts for HF batching...
Sorting completed in 0.55 seconds.
Processing in 303 batches of size 32...


Processing batches: 100%|██████████| 303/303 [12:40<00:00,  2.51s/it]


Finished processing all batches for openai-community/gpt2.
Releasing HF model and tokenizer for openai-community/gpt2 from mps...


Processing models:  83%|████████▎ | 5/6 [1:18:45<15:21, 921.96s/it] 

HF resources released.
--- Finished processing Model: openai-community/gpt2 with params: {'batch_size': 32, 'temperature': 1} ---

--- Processing Model: openai-community/gpt2 with provider: hf and params: {'batch_size': 32, 'temperature': 2} ---
Using HFInterface for openai-community/gpt2 with model_kwargs: {}
Initializing LLMInterface for model: openai-community/gpt2 with params: {'model_kwargs': {}, 'batch_size': 32, 'temperature': 2, 'verbose': True}
Initializing HFInterface for openai-community/gpt2
Using device: mps
Attempting to load model with identifier: 'openai-community/gpt2'
Model openai-community/gpt2 loaded successfully on mps.
Generated 9690 prompts for model openai-community/gpt2 with params {'batch_size': 32, 'temperature': 2}. Processing via HFInterface...
Using batch size: 32, temperature: 2 (from init params)
Preparing 9690 prompts for HF batching...
Sorting completed in 0.57 seconds.
Processing in 303 batches of size 32...


Processing batches: 100%|██████████| 303/303 [13:39<00:00,  2.70s/it]


Finished processing all batches for openai-community/gpt2.
Releasing HF model and tokenizer for openai-community/gpt2 from mps...
HF resources released.


Processing models: 100%|██████████| 6/6 [1:32:27<00:00, 924.58s/it]

--- Finished processing Model: openai-community/gpt2 with params: {'batch_size': 32, 'temperature': 2} ---





Saving results to data/temperature_logprobs.csv...

Completed successfully! Results saved to data/temperature_logprobs.csv
