In [1]:
# Core ML Libraries
import tensorflow as tf
import keras
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt

# RL Libraries  
import gymnasium as gym
from stable_baselines3 import PPO
from stable_baselines3.common.env_util import make_vec_env

# Utilities
import yaml
from PIL import Image

# Reaching this point means every import above resolved without raising.
print("✅ All imports successful!")
# Report the versions of the core numerical stack, one per line.
print(
    f"TensorFlow version: {tf.__version__}",
    f"Keras version: {keras.__version__}",
    f"NumPy version: {np.__version__}",
    sep="\n",
)


✅ All imports successful!
TensorFlow version: 2.19.0
Keras version: 3.10.0
NumPy version: 2.1.3


In [2]:
# Test TensorFlow/Keras: build a tiny binary classifier and fit it on random
# data to confirm that model construction, compilation and training all run.
print("🧠 Testing TensorFlow/Keras...")

# Simple neural network.
# The input shape is declared with an explicit keras.Input entry instead of
# passing `input_shape` to the first Dense layer; Keras 3 emits a UserWarning
# for the latter when used inside a Sequential model.
model = keras.Sequential([
    keras.Input(shape=(10,)),
    keras.layers.Dense(64, activation='relu'),
    keras.layers.Dense(32, activation='relu'),
    keras.layers.Dense(1, activation='sigmoid')
])

model.compile(optimizer='adam', loss='binary_crossentropy', metrics=['accuracy'])
print(f"✅ Neural network created with {model.count_params()} parameters")

# Dummy data: 100 samples with 10 features each and random 0/1 labels.
# Despite the `_test` suffix these arrays are what the model is fitted on;
# the values are unseeded, so only "fit runs without error" is being checked.
X_test = np.random.random((100, 10))
y_test = np.random.randint(0, 2, 100)

# verbose=0 suppresses the per-epoch progress bars.
model.fit(X_test, y_test, epochs=5, verbose=0)
print("✅ TensorFlow/Keras training test successful!")


🧠 Testing TensorFlow/Keras...
✅ Neural network created with 2817 parameters


  super().__init__(activity_regularizer=activity_regularizer, **kwargs)


✅ TensorFlow/Keras training test successful!


In [3]:
# Test Gymnasium and Stable-Baselines3: create a CartPole environment, inspect
# its spaces, then build a PPO agent and train it for a handful of steps.
print("🎮 Testing RL environment...")

env = gym.make('CartPole-v1')
env_vec = None  # assigned inside the try block; checked before closing
try:
    # Resetting confirms the environment can actually produce an observation.
    observation, info = env.reset()

    print(f"Environment: {env.spec.id}")
    print(f"Observation space: {env.observation_space}")
    print(f"Action space: {env.action_space}")

    # Test Stable-Baselines3
    env_vec = make_vec_env('CartPole-v1', n_envs=1)
    # NOTE: this rebinds `model`, replacing the Keras model created in the
    # TensorFlow/Keras test cell.
    model = PPO('MlpPolicy', env_vec, verbose=0)
    print("✅ PPO agent created successfully")

    # Quick training test
    model.learn(total_timesteps=1000)
    print("✅ RL libraries test successful!")
finally:
    # Release the environments even if agent creation or training failed, so
    # a failed check does not leave them open in the running kernel.
    env.close()
    if env_vec is not None:
        env_vec.close()

print("\n🎉 ALL TESTS PASSED! Environment is ready for Escape Cage RL project!")


🎮 Testing RL environment...
Environment: CartPole-v1
Observation space: Box([-4.8               -inf -0.41887903        -inf], [4.8               inf 0.41887903        inf], (4,), float32)
Action space: Discrete(2)
✅ PPO agent created successfully
✅ RL libraries test successful!

🎉 ALL TESTS PASSED! Environment is ready for Escape Cage RL project!
