# Phase 3.6 Hyperparameter Dataset Checker

This notebook loads the most recently modified Parquet file from the Phase 3.6 hyperparameter data directory, reports its shape and column names, and displays the first 10 rows.

In [1]:
import pandas as pd
from pathlib import Path
import glob

# Location of the Phase 3.6 outputs, given relative to the notebook's working directory
data_dir = Path("../data/phase3_6")
print(f"Looking for hyperparameter data in: {data_dir.absolute()}")

# Lift every pandas display limit so long prompt / generated-code cells render in full.
# With max_rows unset an entire frame is printed, so only display small slices.
for option_name in (
    'display.max_colwidth',  # no truncation of cell content
    'display.max_columns',   # no cap on the number of columns shown
    'display.max_rows',      # no cap on the number of rows shown
    'display.width',         # no fixed character width for the rendered table
):
    pd.set_option(option_name, None)

Looking for hyperparameter data in: /Users/krizroycetahimic/Documents/Thesis/Code/pva_sae/phase3_6/../data/phase3_6


In [2]:
# Collect every parquet file in the data directory, newest modification time first
parquet_files = sorted(
    data_dir.glob("*.parquet"),
    key=lambda path: path.stat().st_mtime,
    reverse=True,
)

if parquet_files:
    print(f"Found {len(parquet_files)} parquet files:")
    for file in parquet_files:
        print(f"  - {file.name}")

    # The list is ordered newest-first, so its head is the most recent file
    latest_file = parquet_files[0]
    print(f"\nUsing file: {latest_file.name}")

    # Load the chosen file and summarise it before previewing the rows
    df = pd.read_parquet(latest_file)
    print(f"\nDataset shape: {df.shape}")
    print(f"Columns: {df.columns.tolist()}")
    print("\nFirst 10 rows:")
    display(df.head(10))
else:
    print("No parquet files found!")

Found 1 parquet files:
  - dataset_hyperparams_temp_0_0.parquet

Using file: dataset_hyperparams_temp_0_0.parquet

Dataset shape: (10, 9)
Columns: ['task_id', 'temperature', 'prompt', 'generated_code', 'test_passed', 'error_message', 'generation_time', 'cyclomatic_complexity', 'test_list']

First 10 rows:


Unnamed: 0,task_id,temperature,prompt,generated_code,test_passed,error_message,generation_time,cyclomatic_complexity,test_list
0,28,0.0,"Write a python function to find binomial co-efficient.\n\nassert assert binomial_Coeff(5,2) == 10\nassert assert binomial_Coeff(4,3) == 4\nassert assert binomial_Coeff(3,2) == 3\n\n# Solution:","def binomial_Coeff(n, k):\n if k > n:\n return 0\n if k == 0 or k == n:\n return 1\n return binomial_Coeff(n-1, k-1) + binomial_Coeff(n-1, k)",True,,8.665597,4,"[""assert binomial_Coeff(5,2) == 10"", ""assert binomial_Coeff(4,3) == 4"", ""assert binomial_Coeff(3,2) == 3""]"
1,42,0.0,"Write a python function to find the sum of repeated elements in a given array.\n\nassert assert find_Sum([1,2,3,1,1,4,5,6],8) == 3\nassert assert find_Sum([1,2,3,1,1],5) == 3\nassert assert find_Sum([1,1,2],3) == 2\n\n# Solution:","def find_Sum(arr, n):\n sum = 0\n for i in range(n):\n if arr[i] == n:\n sum += 1\n return sum",False,,5.511933,3,"[""assert find_Sum([1,2,3,1,1,4,5,6],8) == 3"", ""assert find_Sum([1,2,3,1,1],5) == 3"", ""assert find_Sum([1,1,2],3) == 2""]"
2,53,0.0,"Write a python function to check whether the first and last characters of a given string are equal or not.\n\nassert assert check_Equality(""abcda"") == ""Equal""\nassert assert check_Equality(""ab"") == ""Not Equal""\nassert assert check_Equality(""mad"") == ""Not Equal""\n\n# Solution:","def check_Equality(string):\n if string[0] == string[-1]:\n return ""Equal""\n else:\n return ""Not Equal""",True,,4.375003,2,"[""assert check_Equality(\""abcda\"") == \""Equal\"""", ""assert check_Equality(\""ab\"") == \""Not Equal\"""", ""assert check_Equality(\""mad\"") == \""Not Equal\""""]"
3,65,0.0,"Write a function of recursion list sum.\n\nassert assert recursive_list_sum(([1, 2, [3,4],[5,6]]))==21\nassert assert recursive_list_sum(([7, 10, [15,14],[19,41]]))==106\nassert assert recursive_list_sum(([10, 20, [30,40],[50,60]]))==210\n\n# Solution:",def recursive_list_sum(list):\n if len(list)==0:\n return 0\n else:\n return list[0]+recursive_list_sum(list[1:]),False,,5.740386,3,"[""assert recursive_list_sum(([1, 2, [3,4],[5,6]]))==21"", ""assert recursive_list_sum(([7, 10, [15,14],[19,41]]))==106"", ""assert recursive_list_sum(([10, 20, [30,40],[50,60]]))==210""]"
4,67,0.0,Write a function to find the number of ways to partition a set of bell numbers.\n\nassert assert bell_number(2)==2\nassert assert bell_number(10)==115975\nassert assert bell_number(56)==6775685320645824322581483068371419745979053216268760300\n\n# Solution:,def bell_number(n):\n if n == 0:\n return 1\n if n == 1:\n return 1\n if n == 2:\n return 2\n if n == 3:\n return 5\n if n == 4:\n return 14\n if n == 5:\n return 42\n if n == 6:\n return 132\n if n == 7:\n return 429\n if n == 8:\n return 1433\n if n == 9:\n return 4862\n if n == 10:\n return 16796\n if n == 11:\n return 58786\n if n == 12:\n return 208012\n if n == 13:\n return 705122\n if n == 14:\n return 2363490\n if n == 15:\n return 8505102\n if n == 16:\n return 30437276\n if n == 17:\n return 110653730\n if n == 18:\n return 403294150\n if n == 19:\n return 1460614150\n if n == 20:\n return 5413944500\n if n == 21:\n return 20098386900\n if n == 22:\n return 75221809800\n if n == 23:\n return 281427498900\n if n == 24:\n return 1120930408800\n if n == 25:\n return 4450700969600\n if n == 26:\n return 17716623225600\n if n == 27:\n return 75866264643200\n if n == 28:\n return 331687521328000\n if n == 29:\n return 1451121046528000\n if n == 30:\n return 650412864320000\n if n == 31:\n return 2823291531520000\n if n == 32:\n return 13076743686400000\n if n == 33:\n return 60414515264640000\n if n == 34:\n return 251745132867680000\n if n == 35:\n return 1109405604297920000\n if n == 36:\n return 4608013521474560000\n if n == 37:\n return 20160276607388800000\n if n == 38:\n return 9072149134646400000\n if n == 39:\n return 43041474613288000000\n if n == 40:\n return 20515411226566400000\n if n == 41:\n return 102073066453136000000\n if n == 42:\n return 51052633226584000000\n if n == 43:\n return 255051166132960000000\n if n == 44:\n return 127510583066480000000\n if n == 45:\n return 63755291533280000000\n if n == 46:\n return 31876845766560000000\n if n == 47:\n return 159384228832800000000\n if 
n == 48:\n return 80692114416400000000\n if n == 49:\n return 40346057208000000000\n if n == 50:\n return 20173028604000000000\n if n == 51:\n return 100915143200000000000\n if n == 52:\n return 50457071600000000000\n if n == 53:\n return 252285358000000000000\n if n == 54:\n return 126143679000000000000\n if n == 55:\n return 63071839500000000000\n if n == 56:\n return 31535919750000000000\n if n == 57:\n return 157674598750000000000\n if n == 58:\n return 88837299375000000000\n if n == 59:\n return 44418649687500000000\n if n == 60:\n return 22209324843750000000\n if n == 61:\n return 111046624218750000000\n if n == 62:\n return 55523312109375000000\n if n == 63:\n return 27761666054687500000\n if n == 64:\n return 13880833027843750000\n if n == 65:\n return 74404165139218750000\n if n == 66:\n return 37202082569609375000\n if n == 67:\n return 18601041284801875000\n if n == 68:\n return 93005206424009375000\n if n == 69:\n return 46502603212004687500\n if n == 70:\n return 23251301606002343750\n if n == 71:\n return 11625650803001171875\n if n == 72:\n return 5,False,,327.477631,5,"[""assert bell_number(2)==2"", ""assert bell_number(10)==115975"", ""assert bell_number(56)==6775685320645824322581483068371419745979053216268760300""]"
5,68,0.0,"Write a python function to check whether the given array is monotonic or not.\n\nassert assert is_Monotonic([6, 5, 4, 4]) == True\nassert assert is_Monotonic([1, 2, 2, 3]) == True\nassert assert is_Monotonic([1, 3, 2]) == False\n\n# Solution:","def is_Monotonic(arr):\n if len(arr) < 2:\n return True\n if arr[0] > arr[1]:\n return False\n for i in range(1, len(arr) - 1):\n if arr[i] > arr[i + 1]:\n return False\n return True",False,,9.808707,4,"[""assert is_Monotonic([6, 5, 4, 4]) == True"", ""assert is_Monotonic([1, 2, 2, 3]) == True"", ""assert is_Monotonic([1, 3, 2]) == False""]"
6,69,0.0,"Write a function to check whether a list contains the given sublist or not.\n\nassert assert is_sublist([2,4,3,5,7],[3,7])==False\nassert assert is_sublist([2,4,3,5,7],[4,3])==True\nassert assert is_sublist([2,4,3,5,7],[1,6])==False\n\n# Solution:","def is_sublist(l1,l2):\n if len(l1) < len(l2):\n return False\n for i in range(len(l1)):\n if l1[i] in l2:\n return True\n return False",False,,8.076892,9,"[""assert is_sublist([2,4,3,5,7],[3,7])==False"", ""assert is_sublist([2,4,3,5,7],[4,3])==True"", ""assert is_sublist([2,4,3,5,7],[1,6])==False""]"
7,75,0.0,"Write a function to find tuples which have all elements divisible by k from the given list of tuples.\n\nassert assert find_tuples([(6, 24, 12), (7, 9, 6), (12, 18, 21)], 6) == '[(6, 24, 12)]'\nassert assert find_tuples([(5, 25, 30), (4, 2, 3), (7, 8, 9)], 5) == '[(5, 25, 30)]'\nassert assert find_tuples([(7, 9, 16), (8, 16, 4), (19, 17, 18)], 4) == '[(8, 16, 4)]'\n\n# Solution:","def find_tuples(tuples, k):\n return [tuple for tuple in tuples if all(x % k == 0 for x in tuple)]",False,,5.284353,4,"[""assert find_tuples([(6, 24, 12), (7, 9, 6), (12, 18, 21)], 6) == '[(6, 24, 12)]'"", ""assert find_tuples([(5, 25, 30), (4, 2, 3), (7, 8, 9)], 5) == '[(5, 25, 30)]'"", ""assert find_tuples([(7, 9, 16), (8, 16, 4), (19, 17, 18)], 4) == '[(8, 16, 4)]'""]"
8,78,0.0,Write a python function to find number of integers with odd number of set bits.\n\nassert assert count_With_Odd_SetBits(5) == 3\nassert assert count_With_Odd_SetBits(10) == 5\nassert assert count_With_Odd_SetBits(15) == 8\n\n# Solution:,def count_With_Odd_SetBits(n):\n count = 0\n while n > 0:\n count += n & 1\n n >>= 1\n return count\n\n# Time Complexity: O(log n)\n# Space Complexity: O(1),False,,8.199292,3,"[""assert count_With_Odd_SetBits(5) == 3"", ""assert count_With_Odd_SetBits(10) == 5"", ""assert count_With_Odd_SetBits(15) == 8""]"
9,88,0.0,"Write a function to get the frequency of the elements in a list.\n\nassert assert freq_count([10,10,10,10,20,20,20,20,40,40,50,50,30])==({10: 4, 20: 4, 40: 2, 50: 2, 30: 1})\nassert assert freq_count([1,2,3,4,3,2,4,1,3,1,4])==({1:3, 2:2,3:3,4:3})\nassert assert freq_count([5,6,7,4,9,10,4,5,6,7,9,5])==({10:1,5:3,6:2,7:2,4:2,9:2})\n\n# Solution:",def freq_count(lst):\n return {k: lst.count(k) for k in set(lst)},True,,4.599865,1,"[""assert freq_count([10,10,10,10,20,20,20,20,40,40,50,50,30])==({10: 4, 20: 4, 40: 2, 50: 2, 30: 1}) "", ""assert freq_count([1,2,3,4,3,2,4,1,3,1,4])==({1:3, 2:2,3:3,4:3}) "", ""assert freq_count([5,6,7,4,9,10,4,5,6,7,9,5])==({10:1,5:3,6:2,7:2,4:2,9:2}) ""]"
