In [9]:
# %%
# -----------------------------------------------------
# Import the Azure ML core classes (Workspace, Datastore, Dataset) and the Azure credential class
# -----------------------------------------------------
from azureml.core import Workspace, Datastore, Dataset
from azure.identity import DefaultAzureCredential

In [None]:
# %%
# -----------------------------------------------------
#  Create the workspace (or reuse it when it already exists)
# -----------------------------------------------------
# exist_ok=True keeps this cell re-runnable: without it Workspace.create
# fails as soon as 'AzureMLWS04' already exists, which breaks
# "Restart Kernel -> Run All".
ws = Workspace.create(name='AzureMLWS04',
                      subscription_id='9d1e7df0-a4cd-45d3-94d0-9c9208ce45ee',
                      resource_group='teodora.davidkova-rg',
                      create_resource_group=False,   # set to True if the resource group does not exist yet
                      location='westeurope',
                      exist_ok=True)                 # return the existing workspace instead of failing


In [None]:
# Show the identifying properties of the workspace handle
print(
    ws.name,
    ws.location,
    ws.resource_group,
    ws.subscription_id,
)


In [3]:
# %%
# -----------------------------------------------------
# Enumerate the workspaces available in the subscription
# -----------------------------------------------------

# list() over the result of Workspace.list keeps only what iteration yields
# (the captured output shows these are the workspace names)
ws_list = list(
    Workspace.list(subscription_id="9d1e7df0-a4cd-45d3-94d0-9c9208ce45ee")
)
print(ws_list)

['AzureMLWS01', 'AzureMLWS04']


In [None]:
# %%
import json

# Load the workspace and storage settings from the local configuration file
with open('./config.json', 'r') as config_file:
    config = json.load(config_file)

# Echo the settings as a sanity check, but mask the storage account key so the
# secret is not persisted in the saved notebook output
print({key: ('***' if key == 'storage_account_key' else value)
       for key, value in config.items()})

# Extract the account key from the configuration (passed to the datastore registration)
storage_account_key = config.get('storage_account_key')

# Connect to the existing workspace described by the configuration
ws = Workspace(subscription_id=config.get('subscription_id'),
               workspace_name=config.get('workspace_name'),
               resource_group=config.get('resource_group'))
print(ws.name)


In [12]:
# -----------------------------------------------------
# Register the blob container as a workspace datastore
# -----------------------------------------------------
az_store = Datastore.register_azure_blob_container(
    workspace=ws,
    datastore_name="experiment_data",
    account_name="tddata01",          # name of the storage account
    container_name="cont01",          # blob container inside that account
    account_key=storage_account_key,  # storage account key taken from config.json
)

In [5]:
# %%
# -----------------------------------------------------
# List all the datastores of the workspace
# -----------------------------------------------------
store_list = [*ws.datastores]
print(store_list)

# -----------------------------------------------------
# Access a datastore by its name
# -----------------------------------------------------
az_store = Datastore.get(ws, "experiment_data")

['experiment_data', 'cont02', 'workspaceworkingdirectory', 'workspaceartifactstore', 'workspacefilestore', 'workspaceblobstore']


In [18]:
# %%
# -----------------------------------------------------
# Push the local ./data folder into the datastore
# -----------------------------------------------------
# The call is left as the last expression so its return value is shown as the cell output
az_store.upload(src_dir="./data", target_path="Loan Data/data", overwrite=True)

Uploading an estimated of 5 files
Uploading ./data\defaults.csv
Uploaded ./data\defaults.csv, 1 files out of an estimated total of 5
Uploading ./data\Loan+Approval+Prediction.csv
Uploaded ./data\Loan+Approval+Prediction.csv, 2 files out of an estimated total of 5
Uploading ./data\Loan+Data.csv
Uploaded ./data\Loan+Data.csv, 3 files out of an estimated total of 5
Uploading ./data\test.csv
Uploaded ./data\test.csv, 4 files out of an estimated total of 5
Uploading ./data\test1.csv
Uploaded ./data\test1.csv, 5 files out of an estimated total of 5
Uploaded 5 files


$AZUREML_DATAREFERENCE_a5e407a079ac412eb67e7d86afde4725

In [11]:

# -----------------------------------------------------
# Build a tabular dataset from defaults.csv and register it
# -----------------------------------------------------

# (datastore, relative path) pair locating the CSV inside the datastore
csv_path = [(az_store, "Loan Data/data/defaults.csv")]

# Tabular dataset backed by that delimited file
loan_dataset = Dataset.Tabular.from_delimited_files(path=csv_path)

# Register it in the workspace under the name "Defaults"
loan_dataset = loan_dataset.register(
    workspace=ws,
    name="Defaults",
    create_new_version=True,
)


In [19]:

# -----------------------------------------------------
# Build a tabular dataset from Loan+Approval+Prediction.csv and register it
# -----------------------------------------------------

# (datastore, relative path) pair locating the CSV inside the datastore
csv_path = [(az_store, "Loan Data/data/Loan+Approval+Prediction.csv")]

# Tabular dataset backed by that delimited file
loan_dataset2 = Dataset.Tabular.from_delimited_files(path=csv_path)

# Register it in the workspace under the name "LoanApprovalPrediction"
loan_dataset2 = loan_dataset2.register(
    workspace=ws,
    name="LoanApprovalPrediction",
    create_new_version=True,
)


In [17]:
# Load the tabular dataset held in `loan_dataset` into a pandas DataFrame
df = loan_dataset.to_pandas_dataframe()

{'infer_column_types': 'False', 'activity': 'to_pandas_dataframe'}
{'infer_column_types': 'False', 'activity': 'to_pandas_dataframe', 'activityApp': 'TabularDataset'}
