In [None]:
import os
import time
import config
from datetime import datetime
import ollama
from codecarbon import EmissionsTracker
from log_utils import read_log_messages, normalize_template, normalize_template_v1, normalize_template_v2, save_templates
from ollama_utils import start_ollama_server, stop_ollama_server, start_ollama_server_log
from evaluation import evaluate_and_save

In [None]:
# --- Experiment configuration ---
# LLM settings, the task prompt and the system prompts all come from the
# project-local `config` module.
llm_config = config.LLM_CONFIG
task = config.TASK_PROMPT
sys_prompt_few_shot_single_log_parser = config.SYS_MSG_SINGLE_LOG_PARSER_FEW_SHOT
sys_prompt_three_shot_single_log_parser = config.SYS_MSG_SINGLE_LOG_PARSER_THREE_SHOT
sys_prompt_zero_shot_single_log_parser = config.SYS_MSG_SINGLE_LOG_PARSER_ZERO_SHOT

LOG_DIR = config.LOG_DIR
RESULT_DIR = config.RESULT_DIR
# exist_ok=True keeps this cell idempotent on re-run and avoids the
# check-then-create race of a separate os.path.exists() test.
os.makedirs(RESULT_DIR, exist_ok=True)

# Input log file and its ground-truth CSV, both located in LOG_DIR.
input_log_file = "HDFS_200_sampled.log"
log_path = os.path.join(LOG_DIR, input_log_file)
ground_truth_file_path = os.path.join(LOG_DIR, "HDFS_200_sampled_log_structured.csv")

DESIGN = "NA-zero"

# `model_name` is the identifier passed to Ollama; `model` is the same string
# with ':' replaced by '-' and is only used to build the experiment name.
model_name = llm_config["config_list"][0]["model"]
model = model_name.replace(":", "-")
temperature = llm_config["temperature"]
timestamp = datetime.now().strftime("%Y%m%d-%H%M%S")
# NOTE(review): str.capitalize() lower-cases everything after the first
# character, so "NA-zero" becomes "Na-zero" here — confirm this is intended.
project_name = DESIGN.capitalize()
exp_name = f"{project_name}_{model}_{timestamp}"

In [None]:
# --- Ollama Query Function ---
def ask_ollama(model, prompt):
    """Send one prompt to an Ollama model and return the generated text.

    Args:
        model: Name of the Ollama model to query.
        prompt: Full prompt text handed to ``ollama.generate``.

    Returns:
        The value stored under the ``'response'`` key of the reply, or ``None``
        when that key is missing or the call raised ``ollama.ResponseError``
        (in which case the error text is printed).
    """
    # The sampling temperature is read from the notebook-level `temperature`.
    generation_options = {'temperature': temperature}
    try:
        reply = ollama.generate(model=model, prompt=prompt, options=generation_options)
    except ollama.ResponseError as err:
        print('Error:', err.error)
        return None
    else:
        return reply.get('response', None)

# --- Read Log Messages ---
# Load the messages from `log_path` with the project helper; the result is
# iterated one message at a time by the inference loop later in the notebook.
logs = read_log_messages(log_path)

Run inference with CodeCarbon emissions tracking

In [None]:
# --- With CodeCarbon ---
def run_inference_with_emissions(logs, model_name, prompt_prefix, task, exp_name, result_dir):
    """Query the model once per log message while CodeCarbon tracks emissions.

    Args:
        logs: Iterable of log message strings.
        model_name: Model identifier forwarded to ``ask_ollama``.
        prompt_prefix: Text placed at the start of every prompt.
        task: Task text placed between the prefix and the log message.
        exp_name: Passed to ``EmissionsTracker`` as ``project_name``.
        result_dir: Passed to ``EmissionsTracker`` as ``output_dir``.

    Returns:
        List of the non-``None`` responses, in input order.
    """
    tracker = EmissionsTracker(project_name=exp_name, output_dir=result_dir, save_to_file=True)
    collected = []
    tracker.start()
    try:
        for index, log_message in enumerate(logs):
            answer = ask_ollama(model_name, prompt_prefix + task + log_message)
            if answer is None:
                # NOTE(review): a skipped log makes the result shorter than
                # `logs`; if downstream evaluation pairs entries by position
                # this shifts every later template — confirm.
                print(f"[Warning] Skipped log {index} — no response or invalid format.")
                continue
            collected.append(answer)
    finally:
        # Always stop the tracker, even when a query raises.
        emissions = tracker.stop()
    print(f"Emissions: {emissions} kg CO2")
    return collected


In [None]:
# Start the local Ollama server, run the experiment and save the templates.
# The try/finally guarantees the server process is stopped even when
# inference or saving raises, so a failed run does not leave it running.
proc = start_ollama_server()
try:
    time.sleep(5)  # Give it some time to initialize
    parsed_templates = run_inference_with_emissions(logs, model_name, sys_prompt_zero_shot_single_log_parser, task, exp_name, RESULT_DIR)
    save_templates(parsed_templates, llm_config, DESIGN, RESULT_DIR)
finally:
    stop_ollama_server(proc)

In [None]:
# --- Print Results ---
#print("Templates:", parsed_templates)


Evaluate Accuracy

In [None]:
# Evaluate the same parsed templates against the ground truth once per
# normalization function; only the normalizer differs between the calls.
# NOTE(review): all three calls share `exp_name` — confirm evaluate_and_save
# does not overwrite the previous call's output.
_eval_args = (parsed_templates, ground_truth_file_path, exp_name)

results = evaluate_and_save(normalize_template, *_eval_args)        # normalize_template
results_v1 = evaluate_and_save(normalize_template_v1, *_eval_args)  # normalize_template_v1
results_v2 = evaluate_and_save(normalize_template_v2, *_eval_args)  # normalize_template_v2

In [None]:
#print("Results:", results)