# Initialize the configuration for the example notebooks


## Step 1: Copy data from 'data_for_upload' to Amazon S3

### Check that the path to the upload files folder exists

In [None]:
import os

In [None]:
# Local folder that holds the files to be uploaded to Amazon S3
target_path = "./data_for_upload"

# Nothing is created here: a missing folder is only reported to the user
upload_folder_found = os.path.exists(target_path)
if not upload_folder_found:
    print("Error: data for upload folder is not accessible")

### Post file to Amazon S3

In [None]:
from sagemaker import session as sagemaker_session
from boto3 import client as boto3_client

# Create the AWS handles used by the rest of this notebook.
# NOTE: the statement order is kept as-is (SageMaker session first, then the boto3 client).
sess = sagemaker_session.Session()  # sagemaker session for interacting with different AWS APIs
bucket = sess.default_bucket()  # bucket to house artifacts (the session's default bucket)

# S3 client used further down to upload the data file
s3_client = boto3_client("s3")

In [None]:
# Note: s3_data_prefix is the Amazon S3 key prefix under which the training and test data is stored

s3_data_prefix = "djl-mme-sklearn-data"

In [None]:
# Note: djl_mme_sklearn_data is the full Amazon S3 URI (bucket plus data prefix, with a trailing slash)
# of the location that holds the training and test data

djl_mme_sklearn_data = f"s3://{bucket}/{s3_data_prefix}/"

In [None]:
# Note: startups_test_data_csv is the file name of the training and test data CSV;
# the same name is used for the local file and for the object on Amazon S3

startups_test_data_csv = "50_Startups.csv"

In [None]:
# Upload the training and test data CSV from the local upload folder to Amazon S3.
# The object key is the data prefix followed by the unchanged local file name.

with open(f"{target_path}/{startups_test_data_csv}", "rb") as csv_file:
    s3_client.upload_fileobj(
        Fileobj=csv_file,
        Bucket=bucket,
        Key=f"{s3_data_prefix}/{startups_test_data_csv}",
    )

In [None]:
# Verify that the data file is saved to the target location:
# print the S3 path, then list its contents with the AWS CLI

print(djl_mme_sklearn_data)
!aws s3 ls {djl_mme_sklearn_data}

Store the variable values for later use

## Step 2: Set constant value variables that will be used across notebooks

In [None]:
# Note: s3_model_prefix is the Amazon S3 key prefix under which the model tarballs are stored

s3_model_prefix = "djl-mme-sklearn-examples"

In [None]:
# Note: mme_artifacts is the full Amazon S3 URI (bucket plus model prefix, with a trailing slash)
# of the location where the model tarballs are stored for use by the MME

mme_artifacts = f"s3://{bucket}/{s3_model_prefix}/"

In [None]:
# Note: content_type is the content type used when calling the SageMaker Endpoint

content_type = "application/json"

In [None]:
# Note: reference names (tar.gz file names) of the individual scikit-learn models
# (presumably the tarballs stored under mme_artifacts; confirm in the notebooks that use them)
lr_model_reference_name = "sklearn-linear-regression.tar.gz"
etc_model_reference_name = "sklearn-extra-trees-classifier.tar.gz"
moc_model_reference_name = "sklearn-multi-output-classifier.tar.gz"

In [None]:
# Store the variable values with the IPython %store magic for later use across notebooks
# NOTE(review): s3_data_prefix is not stored; confirm that no other notebook needs it
%store djl_mme_sklearn_data 
%store startups_test_data_csv
%store s3_model_prefix
%store mme_artifacts
%store lr_model_reference_name
%store etc_model_reference_name
%store moc_model_reference_name
%store bucket
%store content_type