# Explore Collected Data from Production

## Initialize Workspace

In [None]:
from azure.identity import DefaultAzureCredential
from azure.ai.ml import MLClient

# Authenticate with DefaultAzureCredential, then build the workspace client
# from the workspace configuration
credential = DefaultAzureCredential()
ml_client = MLClient.from_config(credential=credential)

## Load and Explore Data

In this section, we'll load the data assets, convert them to pandas DataFrames, and inspect the last record of each dataset to understand the data. Before running the cell, replace `<deployment-name>` with the name of your deployment.

In [None]:
import mltable

def load_and_inspect_data(asset_name: str, version: str) -> None:
    """Load a registered data asset and print its last record.

    The asset is looked up through the module-level ``ml_client``, its folder
    is read as JSON Lines files into an mltable, and the table is converted
    to a pandas DataFrame. If the DataFrame has no rows, a short notice is
    printed instead of the last record.

    Args:
        asset_name: Name of the data asset to fetch.
        version: Version of the data asset to fetch.
    """
    # Get the data asset
    data_asset = ml_client.data.get(asset_name, version=version)

    # Load the JSON Lines files in the asset's folder as an mltable object
    tbl = mltable.from_json_lines_files(paths=[{'folder': data_asset.path}])

    # Convert the mltable to a pandas DataFrame
    df = tbl.to_pandas_dataframe()

    # An asset without rows has no last record: df.iloc[-1] would raise
    # IndexError and stop the inspection of any remaining assets.
    if df.empty:
        print(f'No records found in {asset_name}.\n')
        return

    # Inspect the last record of the DataFrame
    last_record = df.iloc[-1]
    print(f'Last record of {asset_name}:\n{last_record}\n')

# Deployment name that prefixes every data asset name below
deployment_base_name = "<deployment-name>" # Replace with your deployment name

# Pair each asset name derived from the deployment name with version "1"
asset_info = [
    (name, "1")
    for name in (
        f"{deployment_base_name}-model_outputs",
        f"{deployment_base_name}-model_inputs_outputs",
        f"{deployment_base_name}-model_inputs",
    )
]

# Print the last record of every listed data asset, in order
for asset_name, version in asset_info:
    load_and_inspect_data(asset_name, version)
