## Creating a quality report for two datasets (data_source and ref_data)

In [None]:
%%capture
!pip install -U gretel-client

In [1]:
from gretel_client.config import RunnerMode
from gretel_client.evaluation.quality_report import QualityReport
from gretel_client import configure_session
from gretel_client.projects import create_or_get_unique_project

# Configure the Gretel session; this is where your Gretel API key is specified.
configure_session(
    api_key="prompt",
    cache="yes",
    validate=True,
)

# The two datasets the quality report is built from.
data_source = "https://gretel-public-website.s3.us-west-2.amazonaws.com/datasets/USAdultIncome5kGenerated.csv"
ref_data = "https://gretel-public-website.s3.us-west-2.amazonaws.com/datasets/USAdultIncome5k.csv"

Found cached Gretel credentials
Using endpoint https://api-dev.gretel.cloud
Logged in as anastasia@gretel.ai ✅


In [2]:
# Quality Report in CLOUD: no project is passed, so a temporary project is used.
cloud_report = QualityReport(
    data_source=data_source,
    ref_data=ref_data,
)

# Run the report, then leave `peek()` as the last expression so its result is displayed.
cloud_report.run()
cloud_report.peek()

[32mINFO: [0mStarting poller


{
    "uid": "62cd9d4dc0fe215a31d44eea",
    "guid": "model_2Bqn7qgwG7vQpEe7glp4dc4gWT9",
    "model_name": "wiggly-oafish-sphinx",
    "runner_mode": "cloud",
    "user_id": "629110b1492fbf0f121dcce0",
    "user_guid": "user_29l46LTXd0EnmhRHHfB9DWcO2Sd",
    "billing_domain": "gretel.ai",
    "billing_domain_guid": "domain_28bzIokk1eQdWUYsovba0VN1gtY",
    "project_id": "62cd9d449fb989a899b57219",
    "project_guid": "proj_2Bqn6frmwZnRAs8OohB3LclBztu",
    "status_history": {
        "created": "2022-07-12T16:11:57.168548Z"
    },
    "last_modified": "2022-07-12T16:11:57.312668Z",
    "status": "created",
    "last_active_hb": null,
    "duration_minutes": null,
    "error_msg": null,
    "error_id": null,
    "traceback": null,
    "annotations": null,
    "container_image": "074762682575.dkr.ecr.us-east-2.amazonaws.com/models/evaluate@sha256:ec56e31b2838e9514381dba71e96776df6091853e8c4644b6c118aba8c6fc833",
    "model_type": "evaluate",
    "config": {
        "schema_version": "1.

[32mINFO: [0mStatus is created. Model creation has been queued.
[32mINFO: [0mStatus is pending. A Gretel Cloud worker is being allocated to begin model creation.
[32mINFO: [0mStatus is active. A worker has started creating your model!
2022-07-12T16:12:08.857358Z  Starting Gretel Evaluate
2022-07-12T16:12:08.858485Z  Loading data sets for SQS creation...
2022-07-12T16:12:08.894894Z  Creating SQS...
2022-07-12T16:12:21.104473Z  SQS finished, exporting report artifacts...
2022-07-12T16:12:21.496272Z  Evaluate job completed!
2022-07-12T16:12:21.497492Z  Uploading artifacts to Gretel Cloud


{'raw_score': 100.0, 'grade': 'Excellent', 'score': 100}

In [None]:
# Display the cloud report's `as_dict` attribute (the report in dictionary form).
cloud_report.as_dict

In [None]:
# Display the cloud report's `as_html` attribute.
# NOTE(review): presumably the raw HTML of the report — confirm against the gretel-client docs.
cloud_report.as_html

In [None]:
# Project the local report is attached to; change `name` to use another project.
PROJECT = create_or_get_unique_project(name="Gretel-Evaluate")

# Quality Report run LOCALLY, inside the project specified above.
local_report = QualityReport(
    project=PROJECT,
    data_source=data_source,
    ref_data=ref_data,
    runner_mode=RunnerMode.LOCAL,
    output_dir="report_results",
)

# Run the report, then leave `peek()` as the last expression so its result is displayed.
local_report.run()
local_report.peek()

In [None]:
# Display the local report's `as_dict` attribute (the report in dictionary form).
local_report.as_dict

In [None]:
# Display the local report's `as_html` attribute.
# NOTE(review): presumably the raw HTML of the report — confirm against the gretel-client docs.
local_report.as_html