In [1]:
import itertools

import pandas as pd
from generation import GenerationConfig

  from .autonotebook import tqdm as notebook_tqdm


In [2]:
# --- Study grid --------------------------------------------------------------
# Each entry of `source` is combined with each entry of `models` when the
# generation queue is built.
source = [
    'Franklin/full_study.jsonl',
    'GSM8k/test.jsonl',
    'HotpotQA/hotpot_test_fullwiki_v1.jsonl',
    'StrategyQA/dev_decomp_3_plus.jsonl',
]
models = [
    'google/gemma-2-9b-it',
    'meta-llama/Meta-Llama-3.1-8B-Instruct',
    'microsoft/Phi-3.5-mini-instruct',
    'openai/gpt-4o-mini',
]

# --- Settings applied identically to every (source, model) pair --------------
description = 'final-study'
save = True
batch_size = 8
examples = 64
temperature = 0.2

# --- Prompts -----------------------------------------------------------------
# Two instructions, in order: first ask for a plan only, then ask for the plan
# to be carried out and an answer stated. The literals are split across lines
# for readability; adjacent string literals concatenate to the same text.
plan_prompt = (
    'Create a step-by-step plan for finding the answer to the following problem. '
    'Do not answer the question. '
    'Do not perform the actions in the plan. '
    'Your only task is to outline the steps involved in a concise and clear manner.'
)
execute_prompt = (
    'Now perform the steps in the plan you created. '
    'Use the most precise, accurate and up-to-date information available. '
    'To save space, be concise when describing the actions. '
    'Conclude by stating the answer that you reached by following the steps you outlined.'
)
system_content = [plan_prompt, execute_prompt]


In [3]:
# Build one GenerationConfig object per (source, model) combination.
# Everything except `source` and `model` is the same for all of them, so those
# keyword arguments are collected once and reused.
shared_settings = dict(
    description=description,
    save=save,
    batch_size=batch_size,
    examples=examples,
    temperature=temperature,
    system_content=system_content,
)

configs = []
for s, m in itertools.product(source, models):
    config = GenerationConfig(source=s, model=m, **shared_settings)
    configs.append(config)

# Write the queue to disk as JSON Lines: one record per configuration, taken
# from each object's instance attributes.
queue_records = [vars(cfg) for cfg in configs]
queue_frame = pd.DataFrame(queue_records)
queue_frame.to_json('queue.jsonl', orient='records', lines=True)