In [3]:
import os
import random
import shutil
from tqdm import tqdm

# Configuration: where the images live, where the sample is written, how many
# images to take, and the seed that makes the selection repeatable.
source_dir = "/storage/disk2/sam_resized"
subset_dir = "/storage/disk2/sam_resized_subset"
subset_size = 200
random_seed = 42

# Create the subset directory if it doesn't exist
os.makedirs(subset_dir, exist_ok=True)

# Get list of image files. os.listdir returns entries in arbitrary order, so the
# names are sorted to make the seeded sample below reproducible across runs.
image_files = sorted(
    f for f in os.listdir(source_dir) if f.endswith(('.jpg', '.jpeg', '.png'))
)

# random.sample raises ValueError when asked for more items than the population
# holds, so clamp the request to what is actually available.
sample_size = min(subset_size, len(image_files))
if sample_size < subset_size:
    print(f"Only {len(image_files)} images found in {source_dir}; copying all of them.")

# A dedicated Random instance keeps the seed local instead of reseeding the
# module-level generator that other cells may rely on.
selected_images = random.Random(random_seed).sample(image_files, sample_size)

# Copy (not move) the selected images; the originals stay in source_dir.
print("Copying images...")
for filename in tqdm(selected_images):
    source_path = os.path.join(source_dir, filename)
    dest_path = os.path.join(subset_dir, filename)
    shutil.copy2(source_path, dest_path)  # Using copy2 to preserve metadata

# Report the number actually copied rather than the number requested.
print(f"\nSuccessfully copied {len(selected_images)} images to {subset_dir}")

Moving images...


100%|██████████| 200/200 [00:00<00:00, 563.78it/s]


Successfully copied 200 images to /storage/disk2/sam_resized_subset





In [2]:
import os
from PIL import Image
import numpy as np
from tqdm import tqdm

# Path to images
image_dir = "/storage/disk2/sam_resized"

# Lists to store dimensions (one entry per successfully opened image)
heights = []
widths = []

# Iterate through all images
print("Reading images...")
for filename in tqdm(os.listdir(image_dir)):
    if filename.endswith(('.jpg', '.jpeg', '.png')):
        img_path = os.path.join(image_dir, filename)
        try:
            # The context manager closes the file handle even if reading fails.
            with Image.open(img_path) as img:
                width, height = img.size
                heights.append(height)
                widths.append(width)
        except Exception as e:
            # Best effort: report the unreadable file and keep scanning.
            print(f"Error reading {filename}: {e}")

# Convert to numpy arrays for statistics
heights = np.array(heights)
widths = np.array(widths)

if heights.size == 0:
    # min()/max() raise ValueError on an empty array, so report the situation
    # instead of crashing when nothing could be read.
    print(f"\nNo readable images found in {image_dir}")
else:
    # Same four-line report for each dimension; output matches the previous
    # hand-written height and width sections exactly.
    for label, values in (("Height", heights), ("Width", widths)):
        print(f"\n{label} Statistics:")
        print(f"Min: {values.min()}")
        print(f"Max: {values.max()}")
        print(f"Mean: {values.mean():.2f}")
        print(f"Std: {values.std():.2f}")


Reading images...


100%|██████████| 1096228/1096228 [07:02<00:00, 2596.77it/s]



Height Statistics:
Min: 700
Max: 3093
Mean: 761.31
Std: 133.56

Width Statistics:
Min: 700
Max: 5287
Mean: 987.31
Std: 175.16


In [5]:
# Check available space
import os
import shutil

def get_disk_usage(path):
    """Print total, used and free space of the filesystem containing ``path``.

    Values come from ``shutil.disk_usage`` and are shown in whole GiB
    (floor division by 2**30). Nothing is returned.
    """
    bytes_per_gib = 2**30
    # Convert the three byte counts to whole GiB in one pass.
    total_gib, used_gib, free_gib = (
        amount // bytes_per_gib for amount in shutil.disk_usage(path)
    )
    print(f"Total: {total_gib} GiB")
    print(f"Used: {used_gib} GiB")
    print(f"Free: {free_gib} GiB")

# Locations to inspect: the dataset disk, the kernel's working directory,
# and the system temp directory.
paths_to_check = ["/storage/disk2", os.getcwd(), "/tmp"]

# Print a header line for each location, then its usage report.
for path in paths_to_check:
    print(f"\nChecking {path}:")
    get_disk_usage(path)


Checking /storage/disk2:
Total: 3519 GiB
Used: 617 GiB
Free: 2723 GiB

Checking /storage/disk0/arda/dinov2:
Total: 3519 GiB
Used: 1665 GiB
Free: 1675 GiB

Checking /tmp:
Total: 97 GiB
Used: 89 GiB
Free: 3 GiB


In [6]:
import os
import glob

def cleanup_vscode_tmp(patterns=None):
    """Delete VSCode temporary entries matching glob patterns and print a summary.

    Args:
        patterns: Optional iterable of glob patterns to delete. When omitted,
            the VSCode IPC and TypeScript patterns under /tmp are used.

    Returns:
        None. One line is printed for every entry that could not be removed
        (for example, entries the current user is not permitted to delete),
        followed by the count of entries that were removed.

    Note:
        Matching entries are removed without checking whether anything still
        uses them.
    """
    import shutil  # local import: this cell only imports os and glob

    if patterns is None:
        patterns = [
            '/tmp/vscode-ipc-*',
            '/tmp/vscode-typescript*'
        ]

    files_removed = 0
    for pattern in patterns:
        for file in glob.glob(pattern):
            try:
                # os.remove cannot delete directories, so real directories
                # (not symlinks to them) are removed recursively instead.
                if os.path.isdir(file) and not os.path.islink(file):
                    shutil.rmtree(file)
                else:
                    os.remove(file)
                files_removed += 1
            except OSError as e:
                # Best effort: report the failure and continue with the rest.
                print(f"Error removing {file}: {e}")

    print(f"Removed {files_removed} VSCode temporary files")

# Run the cleanup now; OSError failures during removal are printed by the
# function rather than raised, so this call does not stop the cell on them.
cleanup_vscode_tmp()

Error removing /tmp/vscode-ipc-dd31a14c-87e3-421e-99dd-37d7ee8b5905.sock: [Errno 1] Operation not permitted: '/tmp/vscode-ipc-dd31a14c-87e3-421e-99dd-37d7ee8b5905.sock'
Error removing /tmp/vscode-ipc-5ca6a324-f007-4a5e-9481-3855c60e8364.sock: [Errno 1] Operation not permitted: '/tmp/vscode-ipc-5ca6a324-f007-4a5e-9481-3855c60e8364.sock'
Error removing /tmp/vscode-ipc-61c0e819-ac41-4c52-a69b-ef75eecc44b2.sock: [Errno 1] Operation not permitted: '/tmp/vscode-ipc-61c0e819-ac41-4c52-a69b-ef75eecc44b2.sock'
Error removing /tmp/vscode-ipc-9b03e393-bd1d-48a2-aa88-123e09ddcccd.sock: [Errno 1] Operation not permitted: '/tmp/vscode-ipc-9b03e393-bd1d-48a2-aa88-123e09ddcccd.sock'
Error removing /tmp/vscode-ipc-c03ce3dd-b526-47a5-b9d8-65a7024a47f6.sock: [Errno 1] Operation not permitted: '/tmp/vscode-ipc-c03ce3dd-b526-47a5-b9d8-65a7024a47f6.sock'
Error removing /tmp/vscode-ipc-d997661b-8548-49f0-8425-b0145d6012cd.sock: [Errno 1] Operation not permitted: '/tmp/vscode-ipc-d997661b-8548-49f0-8425-b0145