In [5]:
# Change the working directory to the workspace directory.
import os

# The default is the original hard-coded location. Setting the
# FINETUNING_WORKSPACE_DIR environment variable lets the notebook run from a
# different checkout without editing this cell; an unset or empty value falls
# back to the default.
WORKSPACE_DIR = os.environ.get("FINETUNING_WORKSPACE_DIR") or "/app/finetuning_embeddings"
os.chdir(WORKSPACE_DIR)

# Show the working directory that is now in effect
print(os.getcwd())

/app/finetuning_embeddings


In [6]:
from finetuning_embeddings.utils import check_gpu, validate_file_path

In [7]:
# Print a section banner, then call check_gpu (imported from
# finetuning_embeddings.utils) to report on GPU availability.
gpu_banner = "=== GPU AVAILABILITY CHECK ==="
print(gpu_banner)
check_gpu()

=== GPU AVAILABILITY CHECK ===
You have a GPU available!
Device Name: NVIDIA GeForce RTX 4090
Memory Allocated: 0.00 GB
Memory Cached: 0.00 GB
Total Memory: 23.55 GB
CUDA Capability: (8, 9)


In [8]:
# Create dummy example files and test validate_file_path.
#
# Everything happens inside a temporary directory that is deleted when the
# `with` block exits, so re-running the cell does not leave stray directories
# behind. The paths below are therefore only valid inside this cell.

import tempfile

# 1) Make a temp directory (cleaned up automatically on exit)
with tempfile.TemporaryDirectory() as temp_dir:
    # 2) Dummy input file (CSV) – should validate True
    csv_file = os.path.join(temp_dir, "test.csv")
    with open(csv_file, "w", encoding="utf-8") as f:
        f.write("col1,col2\n1,2")
    print("Input existing .csv:", validate_file_path(csv_file, is_output=False))

    # 3) Non-existent input file (JSON) – should be False
    json_missing = os.path.join(temp_dir, "missing.json")
    print("Input missing .json:", validate_file_path(json_missing, is_output=False))

    # 4) Output to existing dir (case-insensitive .JSON) – should be True
    out_json = os.path.join(temp_dir, "out.JSON")
    print("Output existing dir .JSON:", validate_file_path(out_json, is_output=True))

    # 5) Output to missing dir (.xls) – should be False
    out_xls = os.path.join(temp_dir, "no_dir", "file.xls")
    print("Output missing dir .xls:", validate_file_path(out_xls, is_output=True))

    # 6) Invalid extension – should raise ValueError
    bad = os.path.join(temp_dir, "file.badext")
    try:
        validate_file_path(bad)
    except ValueError as err:
        print("Invalid extension error:", err)
    else:
        # Without this branch a missing exception would pass silently.
        print("Invalid extension error: expected ValueError was not raised")


CSV file validated for input.
Input existing .csv: True
Input missing .json: False
JSON file path is valid for output.
Output existing dir .JSON: True
Output missing dir .xls: False
Invalid extension error: Unsupported file type. Must be .xls, .xlsx, .csv or .json
