In [None]:
import sys
import subprocess
import torch
import transformers
import numpy as np
import pandas as pd
from PIL import Image
import matplotlib.pyplot as plt
import seaborn as sns

In [None]:
def install_packages():
    """Install required packages for multimodal AI research.

    Every entry of ``packages`` is a whitespace-separated group of package
    names. Each group is installed with a single ``pip install`` call executed
    through the interpreter running this notebook (``sys.executable -m pip``),
    so the packages land in the kernel's own environment.

    A group whose pip invocation exits with a non-zero status is reported and
    skipped; the remaining groups are still attempted. Nothing is returned and
    ``subprocess.CalledProcessError`` is never propagated to the caller.
    """
    packages = [
        "torch torchvision torchaudio",
        "transformers datasets",
        "opencv-python librosa",
        "wandb tensorboard",
        "accelerate deepspeed",
        "timm albumentations",
        # NOTE(review): OpenAI's Whisper is normally published on PyPI as
        # "openai-whisper" -- confirm this name is the intended distribution.
        "whisper-openai",
        "diffusers",
        "sentence-transformers"
    ]

    for package in packages:
        # Each list item becomes exactly one argv entry, so the group must be
        # split; passed whole, "torch torchvision torchaudio" would reach pip
        # as a single (invalid) requirement string and the install would fail.
        command = [sys.executable, "-m", "pip", "install", *package.split()]
        try:
            subprocess.check_call(command)
            print(f"✓ Installed {package}")
        except subprocess.CalledProcessError:
            print(f"✗ Failed to install {package}")

In [None]:
def check_gpu_setup():
    """Print a short report on CUDA availability and run a smoke-test matmul.

    When CUDA is available, the CUDA version, the number of visible GPUs and,
    for each GPU, its name and total memory (in units of 1e9 bytes) are
    printed. Regardless of CUDA availability, a 1000x1000 random matrix is
    moved to the selected device ("cuda" if available, otherwise "cpu") and
    multiplied by its transpose; a confirmation line is printed afterwards.

    Returns nothing; all results are written to stdout.
    """
    has_cuda = torch.cuda.is_available()

    print("=== GPU Setup Check ===")
    print(f"CUDA available: {has_cuda}")

    if has_cuda:
        gpu_total = torch.cuda.device_count()
        print(f"CUDA version: {torch.version.cuda}")
        print(f"GPU count: {gpu_total}")
        for idx in range(gpu_total):
            gpu_name = torch.cuda.get_device_name(idx)
            gpu_props = torch.cuda.get_device_properties(idx)
            print(f"GPU {idx}: {gpu_name}")
            print(f"Memory: {gpu_props.total_memory / 1e9:.1f} GB")

    # Smoke test: allocate on the chosen device and do one matrix product.
    device = torch.device("cuda") if has_cuda else torch.device("cpu")
    sample = torch.randn(1000, 1000).to(device)
    torch.mm(sample, sample.t())
    print(f"✓ Basic tensor operations working on {device}")

In [None]:
def test_libraries():
    """Probe the core libraries and print one status line per library group.

    Three independent probes run in order: transformers (loads the
    "bert-base-uncased" tokenizer and tokenizes a short string), computer
    vision (imports cv2 and builds a torchvision resize transform) and audio
    (imports librosa). Each probe prints a "✓" line on success, or a "✗" line
    containing the exception text on any failure; a failure in one probe does
    not stop the others. Nothing is returned.
    """

    def _probe_transformers():
        # Imported lazily so a missing package is reported, not fatal.
        try:
            from transformers import AutoTokenizer
            bert_tokenizer = AutoTokenizer.from_pretrained("bert-base-uncased")
            bert_tokenizer("Hello world!")
            print("✓ Transformers library working")
        except Exception as err:
            print(f"✗ Transformers error: {err}")

    def _probe_vision():
        try:
            import cv2
            import torchvision.transforms as transforms
            transforms.Compose([transforms.Resize((224, 224))])
            print("✓ Computer vision libraries working")
        except Exception as err:
            print(f"✗ CV libraries error: {err}")

    def _probe_audio():
        try:
            import librosa
            print("✓ Audio processing libraries working")
        except Exception as err:
            print(f"✗ Audio libraries error: {err}")

    print("\n=== Library Tests ===")
    for probe in (_probe_transformers, _probe_vision, _probe_audio):
        probe()

In [None]:
# Run the environment checks: GPU/CUDA report first, then the library probes.
# install_packages() is not called in this cell, so nothing is installed here.
check_gpu_setup()
test_libraries()