In [1]:
# Test for the 'dask_ml' Python package

# Step 1: Import the package
# Only the imports live inside the ``try`` so that the failure message is
# printed exclusively for import-time errors; the success message goes in the
# ``else`` branch, which runs only when every import succeeded.
try:
    import dask_ml
    from dask_ml.linear_model import LogisticRegression
    from dask_ml.model_selection import train_test_split
    from dask_ml.datasets import make_classification
    from dask.distributed import Client
except Exception as e:
    print(f"Step 1 failed: {e}")
    # Bare ``raise`` re-raises the active exception with its original traceback.
    raise
else:
    print("Step 1: Importing dask_ml and necessary modules passed.")

# Step 2: Perform a simple operation with dask_ml
# ``client`` starts as None so the failure path below can tell whether a
# client was ever created before trying to release it.
client = None
try:
    # Set up a Dask client
    client = Client()  # This sets up a Dask scheduler
    print("Step 2: Dask client set up successfully.")

    # Create a synthetic dataset with explicit chunking
    X, y = make_classification(n_samples=1000, n_features=20, random_state=42, chunks=100)
    print("Step 2: Synthetic dataset created successfully.")

    # Split the dataset (20% held out for testing)
    X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42)
    print("Step 2: Dataset split into training and test sets successfully.")

    # Initialize and fit a logistic regression model
    model = LogisticRegression()
    model.fit(X_train, y_train)
    print("Step 2: Logistic regression model fitted successfully.")

    # Make predictions; only the first five are computed for display
    predictions = model.predict(X_test)
    print(f"Step 2: Predictions made successfully. Sample predictions: {predictions[:5].compute()}")

    # Evaluate accuracy on the held-out test set
    score = model.score(X_test, y_test).compute()  # Compute the score to get a float value
    print(f"Step 2: Model accuracy on test set: {score:.2f}")
except Exception as e:
    print(f"Step 2 failed: {e}")
    # Step 3 is never reached when this block re-raises, so release the client
    # here; otherwise it would stay alive after the failure.
    if client is not None:
        try:
            client.close()
        except Exception as close_error:
            # Best effort only: report the cleanup problem but let the
            # original Step 2 failure be the exception that propagates.
            print(f"Step 2 cleanup failed: {close_error}")
    raise

# Step 3: Shut down the Dask client
# Reached only when Step 2 succeeded, so ``client`` is a live Client here.
try:
    client.close()
    print("Step 3: Dask client shut down successfully.")
except Exception as e:
    print(f"Step 3 failed: {e}")
    raise

# Final Confirmation
# Every step above re-raises on failure, so execution only reaches this line
# when all steps completed without an exception.
print("All tests for the 'dask_ml' package completed successfully.")


Step 1: Importing dask_ml and necessary modules passed.
Step 2: Dask client set up successfully.
Step 2: Synthetic dataset created successfully.
Step 2: Dataset split into training and test sets successfully.




Step 2: Logistic regression model fitted successfully.
Step 2: Predictions made successfully. Sample predictions: [False  True False False  True]
Step 2: Model accuracy on test set: 0.64
Step 3: Dask client shut down successfully.
All tests for the 'dask_ml' package completed successfully.
