# Check DBFS Classification Path
This notebook lists the contents of `/dbfs/mnt/lab/unrestricted/KritiM/classification/` and verifies that `trainingSample.csv` in that directory is accessible.

In [None]:
# Check if we're running in Databricks environment, then list the target path.
# Environment setup and the path listing are handled separately so that a
# missing/unmounted path is not misreported as a missing Databricks environment.
print("Checking Databricks environment...")
try:
    from pyspark.dbutils import DBUtils
    from pyspark.sql import SparkSession

    # Get or create a Spark session and build a DBUtils handle from it
    spark = SparkSession.builder.appName("PathCheck").getOrCreate()
    dbutils = DBUtils(spark)
except Exception as e:
    print(f"Error: Not running in Databricks environment or not properly configured.\nDetails: {str(e)}\n")
    print("Please make sure you're connected to a Databricks cluster to run this notebook.")
else:
    # Only attempt the listing once spark/dbutils were created successfully
    print("\nChecking path using dbutils.fs.ls:")
    try:
        display(dbutils.fs.ls("dbfs:/mnt/lab/unrestricted/KritiM/classification/"))
    except Exception as e:
        # The environment is fine at this point; the failure is specific to the path
        print(f"Error: Could not list path.\nDetails: {str(e)}")

In [None]:
# Method 2: list the directory with os.listdir on the /dbfs path
import os

print("\nChecking path using os.listdir:")
path = "/dbfs/mnt/lab/unrestricted/KritiM/classification/"
try:
    files = os.listdir(path)
    for entry in files:
        entry_path = os.path.join(path, entry)
        # Regular files are shown with their byte size; everything else is labelled "DIR"
        if os.path.isfile(entry_path):
            size_label = os.path.getsize(entry_path)
        else:
            size_label = "DIR"
        print(f"{entry:<30} {size_label:>10}")
except Exception as err:
    print(f"Error: {err}")

In [None]:
# Method 3: look for trainingSample.csv and, when present, report its size
# and show a short preview
print("\nChecking for trainingSample.csv:")
csv_path = "/dbfs/mnt/lab/unrestricted/KritiM/classification/trainingSample.csv"
if not os.path.exists(csv_path):
    print("trainingSample.csv not found at this location")
else:
    size_bytes = os.path.getsize(csv_path)
    size_mb = size_bytes / (1024 * 1024)
    print(f"trainingSample.csv exists, size: {size_mb:.2f} MB")

    # pandas is only needed for the preview, so it is imported on this branch
    import pandas as pd
    try:
        # Read just the first five rows rather than the whole file
        df = pd.read_csv(csv_path, nrows=5)
        print("\nFirst 5 rows preview:")
        display(df)
    except Exception as err:
        print(f"Error reading CSV: {err}")

In [None]:
# Method 4: Check mount point status
# Lists the DBFS mounts and reports every mount whose mount point contains
# 'KritiM'. Failures are reported instead of raised, matching the other cells.
print("\nChecking all mount points:")
relevant_mounts = []
try:
    mounts = dbutils.fs.mounts()
except Exception as e:
    # Covers a missing dbutils handle (NameError when the environment cell
    # did not succeed) as well as errors raised by the mounts call itself.
    mounts = []
    print(f"Error: Could not list mount points.\nDetails: {str(e)}")
else:
    relevant_mounts = [m for m in mounts if 'KritiM' in m.mountPoint]
    for mount in relevant_mounts:
        print("Found relevant mount:")
        print(f"Mount point: {mount.mountPoint}")
        print(f"Source: {mount.source}")
    if not relevant_mounts:
        # Make the "nothing matched" outcome explicit instead of printing nothing
        print("No mount point containing 'KritiM' was found")

## Alternative Paths
If the mount path is not accessible, we can check some alternative locations where the file might be:

In [None]:
# Probe a few fallback DBFS locations and show what each one contains
alt_paths = [
    "dbfs:/FileStore/SoilMapping/classification/",
    "dbfs:/mnt/default/SoilMapping/classification/",
    "dbfs:/FileStore/",
]

for path in alt_paths:
    print(f"\nChecking {path}")
    try:
        # Listing and display stay inside the try so any failure for this
        # location is reported and the loop moves on to the next one
        files = dbutils.fs.ls(path)
        print("Contents:")
        display(files)
    except Exception as err:
        print(f"Error or path not accessible: {err}")