In [7]:
import pandas as pd
import os
from pathlib import Path
import glob

# Auto-discovery of latest Phase 3.5 data
datasets_dir = "../data/phase3_5/"
pattern = os.path.join(datasets_dir, "dataset_temp_*.parquet")
matching_files = glob.glob(pattern)

if matching_files:
    # Sort by modification time, newest first
    matching_files.sort(key=lambda x: os.path.getmtime(x), reverse=True)
    print(f"🔍 Found {len(matching_files)} temperature files (newest first)")
    for file in matching_files:
        print(f"  📁 {Path(file).name}")
else:
    raise FileNotFoundError(f"No temperature dataset files found in {datasets_dir}")

🔍 Found 5 temperature files (newest first)
  📁 dataset_temp_0_6.parquet
  📁 dataset_temp_1_2.parquet
  📁 dataset_temp_0_9.parquet
  📁 dataset_temp_0_3.parquet
  📁 dataset_temp_0_0.parquet


In [8]:
# Load and display first 5 records for each temperature dataset
for file_path in matching_files:
    file_name = Path(file_path).name
    print(f"\n{'='*50}")
    print(f"Dataset: {file_name}")
    print(f"{'='*50}")
    
    df = pd.read_parquet(file_path)
    print(f"Records: {len(df)}")
    print(f"Columns: {list(df.columns)}")
    print("\nFirst 5 records:")
    display(df.head(50))


Dataset: dataset_temp_0_6.parquet
Records: 60
Columns: ['task_id', 'temperature', 'prompt', 'generated_code', 'test_passed', 'error_message', 'generation_time', 'cyclomatic_complexity', 'generation_idx']

First 5 records:


Unnamed: 0,task_id,temperature,prompt,generated_code,test_passed,error_message,generation_time,cyclomatic_complexity,generation_idx
0,1,0.6,Write a Python function to solve the following...,"def min_cost(cost, m, n):\n # Your code her...",False,,29.381733,7,0
1,1,0.6,Write a Python function to solve the following...,"def min_cost(cost, m, n):\n\n# Your code here\...",False,,11.851039,7,1
2,1,0.6,Write a Python function to solve the following...,"def min_cost(cost, m, n):\n # Write your co...",False,,33.136135,7,2
3,5,0.6,Write a Python function to solve the following...,# Solution:\ndef count_ways(n):\n if n == 1...,False,,22.800214,2,0
4,5,0.6,Write a Python function to solve the following...,def count_ways(n):\n return 0\n\n# Test cod...,False,,9.309174,2,1
5,5,0.6,Write a Python function to solve the following...,# Function definition\ndef count_ways(n):\n ...,False,,12.254187,2,2
6,8,0.6,Write a Python function to solve the following...,def square_nums(nums):,False,,1.98659,1,0
7,8,0.6,Write a Python function to solve the following...,def square_nums(nums):\n return [lambda x: ...,False,,4.100458,1,1
8,8,0.6,Write a Python function to solve the following...,def square_nums(nums):\n return [x**2 for x...,True,,3.648428,1,2
9,10,0.6,Write a Python function to solve the following...,"def small_nnum(dataSet,n):\n """"""\n This ...",False,,22.197321,1,0



Dataset: dataset_temp_1_2.parquet
Records: 50
Columns: ['task_id', 'temperature', 'prompt', 'generated_code', 'test_passed', 'error_message', 'generation_time', 'cyclomatic_complexity', 'generation_idx']

First 5 records:


Unnamed: 0,task_id,temperature,prompt,generated_code,test_passed,error_message,generation_time,cyclomatic_complexity,generation_idx
0,1,1.2,Write a Python function to solve the following...,import functools\n\ndef min(x):\n functools...,False,,25.437566,7,0
1,1,1.2,Write a Python function to solve the following...,'''This code will calculate the path from the ...,False,,46.358381,7,1
2,1,1.2,Write a Python function to solve the following...,"def min_cost(cost, destination, n):\n\nIf you ...",False,,41.394968,7,2
3,1,1.2,Write a Python function to solve the following...,function code for min_cost()\nimport numpy as ...,False,,44.331651,7,3
4,1,1.2,Write a Python function to solve the following...,"def min_cost(cost, m, n):\n for i in range(...",False,,18.396529,7,4
5,5,1.2,Write a Python function to solve the following...,"import unittest\n\ndef count_ways(rows, cols) ...",False,,6.213836,2,0
6,5,1.2,Write a Python function to solve the following...,Note:\nDon't reinvent the solution for DP!\n\n...,False,,101.822943,2,1
7,5,1.2,Write a Python function to solve the following...,def count_ways(n):,False,,2.016571,2,2
8,5,1.2,Write a Python function to solve the following...,,False,,0.320443,2,3
9,5,1.2,Write a Python function to solve the following...,def count_ways(n):\n# base case\nif n >= 1:\n#...,False,,20.159765,2,4



Dataset: dataset_temp_0_9.parquet
Records: 50
Columns: ['task_id', 'temperature', 'prompt', 'generated_code', 'test_passed', 'error_message', 'generation_time', 'cyclomatic_complexity', 'generation_idx']

First 5 records:


Unnamed: 0,task_id,temperature,prompt,generated_code,test_passed,error_message,generation_time,cyclomatic_complexity,generation_idx
0,1,0.9,Write a Python function to solve the following...,"def min_cost(costs, m, n):\n # Function to f...",False,,409.007721,7,0
1,1,0.9,Write a Python function to solve the following...,"min_cost(cost_matrix, m, n):\n # Check if t...",False,,15.275557,7,1
2,1,0.9,Write a Python function to solve the following...,"def min_cost(cost, m, n):\n m, n = 10, 4\n ...",False,,315.441344,7,2
3,1,0.9,Write a Python function to solve the following...,"def min_cost(cost, m, n):\n if m < 0 or m >...",False,,28.833237,7,3
4,1,0.9,Write a Python function to solve the following...,"def min_cost(cost, m, n):\n # Calculate num...",False,,200.918921,7,4
5,5,0.9,Write a Python function to solve the following...,def count_ways(n):\n return\n\n# Return the...,False,,5.949788,2,0
6,5,0.9,Write a Python function to solve the following...,def count_ways(length):\nreturn 0\n\n# Test th...,False,,9.234527,2,1
7,5,0.9,Write a Python function to solve the following...,,False,,0.324869,2,2
8,5,0.9,Write a Python function to solve the following...,from math import factorial\ndef count_ways(n):...,False,,192.334744,2,3
9,5,0.9,Write a Python function to solve the following...,"class Solution:\n """"""\n @param dominoes:...",False,,96.731005,2,4



Dataset: dataset_temp_0_3.parquet
Records: 50
Columns: ['task_id', 'temperature', 'prompt', 'generated_code', 'test_passed', 'error_message', 'generation_time', 'cyclomatic_complexity', 'generation_idx']

First 5 records:


Unnamed: 0,task_id,temperature,prompt,generated_code,test_passed,error_message,generation_time,cyclomatic_complexity,generation_idx
0,1,0.3,Write a Python function to solve the following...,"def min_cost(cost, m, n):\n # Your code her...",False,,30.142816,7,0
1,1,0.3,Write a Python function to solve the following...,"def min_cost(cost, m, n):\n # Your code her...",False,,4.318848,7,1
2,1,0.3,Write a Python function to solve the following...,"def min_cost(cost, m, n):\n # Write your co...",False,,24.402323,7,2
3,1,0.3,Write a Python function to solve the following...,"def min_cost(cost, m, n):\n # Write your co...",False,,24.097416,7,3
4,1,0.3,Write a Python function to solve the following...,"def min_cost(cost, m, n):\n # Your code her...",False,,4.014662,7,4
5,5,0.3,Write a Python function to solve the following...,def count_ways(n):\n if n == 1:\n re...,False,,412.710801,2,0
6,5,0.3,Write a Python function to solve the following...,def count_ways(n):\n\n# Your code here:\nretur...,False,,3.885333,2,1
7,5,0.3,Write a Python function to solve the following...,def count_ways(n):\n if n == 1:\n re...,False,,12.791249,2,2
8,5,0.3,Write a Python function to solve the following...,def count_ways(n):\n return 0\n\n# Test cod...,False,,9.233836,2,3
9,5,0.3,Write a Python function to solve the following...,def count_ways(n):\n # Your code here:\n ...,False,,3.250301,2,4



Dataset: dataset_temp_0_0.parquet
Records: 50
Columns: ['task_id', 'temperature', 'prompt', 'generated_code', 'test_passed', 'error_message', 'generation_time', 'cyclomatic_complexity', 'generation_idx']

First 5 records:


Unnamed: 0,task_id,temperature,prompt,generated_code,test_passed,error_message,generation_time,cyclomatic_complexity,generation_idx
0,1,0.0,Write a Python function to solve the following...,"def min_cost(cost, m, n):\n # Write your co...",False,,29.545906,7,0
1,5,0.0,Write a Python function to solve the following...,def count_ways(n):\n if n == 1:\n re...,False,,405.833809,2,0
2,8,0.0,Write a Python function to solve the following...,def square_nums(nums):\n return [x**2 for x...,True,,4.439466,1,0
3,10,0.0,Write a Python function to solve the following...,"def small_nnum(num_list, n):\n # Your code ...",False,,5.269413,1,0
4,14,0.0,Write a Python function to solve the following...,"def find_Volume(base, height, width):\n ret...",False,,5.222691,1,0
5,17,0.0,Write a Python function to solve the following...,def square_perimeter(side):\n return side**2,False,,5.013457,1,0
6,18,0.0,Write a Python function to solve the following...,"def remove_dirty_chars(s1, s2):\n return s1...",False,,5.303037,3,0
7,20,0.0,Write a Python function to solve the following...,def is_woodall(number):\n if number % 2 == ...,False,,6.730649,5,0
8,21,0.0,Write a Python function to solve the following...,"def multiples_of_num(num, n):\n return [i f...",False,,6.265986,1,0
9,22,0.0,Write a Python function to solve the following...,def find_first_duplicate(arr):\n for i in r...,True,,10.498238,3,0
