# Edit Your Expectation Suite
Use this notebook to recreate and modify your expectation suite:

**Expectation Suite Name**: `testge`


In [93]:
import datetime

import pandas as pd

import great_expectations as ge
import great_expectations.jupyter_ux
from great_expectations.core.batch import BatchRequest
from great_expectations.checkpoint import SimpleCheckpoint
from great_expectations.exceptions import DataContextError

context = ge.data_context.DataContext()

# Note that if you modify this batch request, you may save the new version as a .json file
#  to pass in later via the --batch-request option
batch_request = {'datasource_name': 'SEVIR_CATALOG_1', 'data_connector_name': 'default_inferred_data_connector_name', 'data_asset_name': 'CATALOG.csv', 'limit': 1000}


# Feel free to change the name of your suite here. Renaming this will not remove the other one.
expectation_suite_name = "testge"
try:
    suite = context.get_expectation_suite(expectation_suite_name=expectation_suite_name)
    print(f'Loaded ExpectationSuite "{suite.expectation_suite_name}" containing {len(suite.expectations)} expectations.')
except DataContextError:
    suite = context.create_expectation_suite(expectation_suite_name=expectation_suite_name)
    print(f'Created ExpectationSuite "{suite.expectation_suite_name}".')


validator = context.get_validator(
    batch_request=BatchRequest(**batch_request),
    expectation_suite_name=expectation_suite_name
)
column_names = [f'"{column_name}"' for column_name in validator.columns()]
print(f"Columns: {', '.join(column_names)}.")
validator.head(n_rows=5, fetch_all=False)

  and should_run_async(code)


Loaded ExpectationSuite "testge" containing 85 expectations.


  df = reader_fn(path, **reader_options)


Calculating Metrics:   0%|          | 0/2 [00:00<?, ?it/s]

Columns: "id", "file_name", "file_index", "img_type", "time_utc", "minute_offsets", "episode_id", "event_id", "event_type", "llcrnrlat", "llcrnrlon", "urcrnrlat", "urcrnrlon", "proj", "size_x", "size_y", "height_m", "width_m", "data_min", "data_max", "pct_missing".


Calculating Metrics:   0%|          | 0/1 [00:00<?, ?it/s]

Unnamed: 0,id,file_name,file_index,img_type,time_utc,minute_offsets,episode_id,event_id,event_type,llcrnrlat,llcrnrlon,urcrnrlat,urcrnrlon,proj,size_x,size_y,height_m,width_m,data_min,data_max,pct_missing
0,R18032505027684,vis/2018/SEVIR_VIS_RANDOMEVENTS_2018_0321_0331.h5,0,vis,2018-03-25 05:00:00,-120:-115:-110:-105:-100:-95:-90:-85:-80:-75:-70:-65:-60:-55:-50:-45:-40:-40:-30:-25:-20:-15:-10:-5:0:5:10:15:20:25:30:35:40:45:50:55:60:65:70:75:80:85:90:95:100:105:110:115:120,,,,33.216708,-91.635132,36.336627,-87.070254,+proj=laea +lat_0=38 +lon_0=-98 +units=m +a=6370997.0 +ellps=sphere,768,768,384000.0,384000.0,-0.003361,0.0056,0.0
1,R18032505027677,vis/2018/SEVIR_VIS_RANDOMEVENTS_2018_0321_0331.h5,1,vis,2018-03-25 05:00:00,-120:-115:-110:-105:-100:-95:-90:-85:-80:-75:-70:-65:-60:-55:-50:-45:-40:-40:-30:-25:-20:-15:-10:-5:0:5:10:15:20:25:30:35:40:45:50:55:60:65:70:75:80:85:90:95:100:105:110:115:120,,,,33.084309,-91.849435,36.213723,-87.301535,+proj=laea +lat_0=38 +lon_0=-98 +units=m +a=6370997.0 +ellps=sphere,768,768,384000.0,384000.0,-0.003361,0.0056,0.0
2,R18032505027721,vis/2018/SEVIR_VIS_RANDOMEVENTS_2018_0321_0331.h5,2,vis,2018-03-25 05:00:00,-120:-115:-110:-105:-100:-95:-90:-85:-80:-75:-70:-65:-60:-55:-50:-45:-40:-40:-30:-25:-20:-15:-10:-5:0:5:10:15:20:25:30:35:40:45:50:55:60:65:70:75:80:85:90:95:100:105:110:115:120,,,,46.661866,-123.509928,50.883159,-120.009277,+proj=laea +lat_0=38 +lon_0=-98 +units=m +a=6370997.0 +ellps=sphere,768,768,384000.0,384000.0,-0.00287,0.005548,0.0
3,R18032516508249,vis/2018/SEVIR_VIS_RANDOMEVENTS_2018_0321_0331.h5,3,vis,2018-03-25 16:50:00,-120:-115:-110:-105:-100:-95:-90:-85:-80:-75:-70:-65:-60:-55:-50:-45:-40:-35:-30:-25:-20:-15:-10:-5:0:5:10:15:20:25:30:35:40:45:50:55:60:60:70:75:80:85:90:95:100:105:110:115:120,,,,40.883237,-85.350213,43.686191,-79.903987,+proj=laea +lat_0=38 +lon_0=-98 +units=m +a=6370997.0 +ellps=sphere,768,768,384000.0,384000.0,0.029911,0.7856,0.0
4,R18032516507621,vis/2018/SEVIR_VIS_RANDOMEVENTS_2018_0321_0331.h5,4,vis,2018-03-25 16:50:00,-120:-115:-110:-105:-100:-95:-90:-85:-80:-75:-70:-65:-60:-55:-50:-45:-40:-35:-30:-25:-20:-15:-10:-5:0:5:10:15:20:25:30:35:40:45:50:55:60:60:70:75:80:85:90:95:100:105:110:115:120,,,,44.946047,-123.972935,49.169436,-120.575175,+proj=laea +lat_0=38 +lon_0=-98 +units=m +a=6370997.0 +ellps=sphere,768,768,384000.0,384000.0,0.02856,0.79261,0.0


## Create & Edit Expectations


Add expectations by calling specific expectation methods on the `validator` object. They all begin with `.expect_` which makes autocompleting easy using tab.

Because you selected interactive mode, you are now creating or editing an Expectation Suite with validator feedback from the sample batch of data that you specified (see `batch_request`).

Note that if you select manual mode you may still create or edit an Expectation Suite directly, without feedback from the `validator`. See our documentation for more info and examples: [How to create a new Expectation Suite without a sample batch](https://docs.greatexpectations.io/docs/guides/expectations/how_to_create_and_edit_expectations_based_on_domain_knowledge_without_inspecting_data_directly).



You can see all the available expectations in the **[expectation gallery](https://greatexpectations.io/expectations)**.

### Table Expectation(s)

In [94]:

validator.expect_table_columns_to_match_set(column_set=['event_id', 'episode_id', 'data_min', 'pct_missing', 'width_m', 'event_type', 'time_utc', 'id', 'urcrnrlon', 'llcrnrlat', 'llcrnrlon', 'file_name', 'data_max', 'minute_offsets', 'size_x', 'img_type', 'proj', 'height_m', 'urcrnrlat', 'size_y', 'file_index'])

  and should_run_async(code)


Calculating Metrics:   0%|          | 0/2 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "observed_value": [
      "id",
      "file_name",
      "file_index",
      "img_type",
      "time_utc",
      "minute_offsets",
      "episode_id",
      "event_id",
      "event_type",
      "llcrnrlat",
      "llcrnrlon",
      "urcrnrlat",
      "urcrnrlon",
      "proj",
      "size_x",
      "size_y",
      "height_m",
      "width_m",
      "data_min",
      "data_max",
      "pct_missing"
    ]
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [95]:

validator.expect_table_row_count_to_be_between(max_value=76004, min_value=76004)

Calculating Metrics:   0%|          | 0/1 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "observed_value": 76004
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

### Column Expectation(s)

#### `id`

In [96]:

validator.expect_column_values_to_not_be_null(column='id', meta={'profiler_details': {'metric_configuration': {'domain_kwargs': {'column': 'id'}, 'metric_dependencies': None, 'metric_name': 'column_values.nonnull.unexpected_count', 'metric_value_kwargs': None}, 'num_batches': 2}})

Calculating Metrics:   0%|          | 0/6 [00:00<?, ?it/s]

  return list(domain_values[: result_format["partial_unexpected_count"]])


{
  "success": true,
  "result": {
    "element_count": 76004,
    "unexpected_count": 0,
    "unexpected_percent": 0.0,
    "partial_unexpected_list": []
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [99]:

validator.expect_column_value_lengths_to_be_between(column='id', max_value=15, min_value=7, mostly=1.0, strict_max=False, strict_min=False, meta={'profiler_details': {'column_max_length_range_estimator': {'metric_configuration': {'domain_kwargs': {'column': 'id'}, 'metric_dependencies': None, 'metric_name': 'column_values.length.max', 'metric_value_kwargs': None}, 'num_batches': 1}, 'column_min_length_range_estimator': {'metric_configuration': {'domain_kwargs': {'column': 'id'}, 'metric_dependencies': None, 'metric_name': 'column_values.length.min', 'metric_value_kwargs': None}, 'num_batches': 1}}})

Calculating Metrics:   0%|          | 0/9 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "element_count": 76004,
    "unexpected_count": 0,
    "unexpected_percent": 0.0,
    "partial_unexpected_list": [],
    "missing_count": 0,
    "missing_percent": 0.0,
    "unexpected_percent_total": 0.0,
    "unexpected_percent_nonmissing": 0.0
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [100]:

validator.expect_column_values_to_match_regex(column='id', mostly=1.0, regex='-?\d+', meta={'profiler_details': {'evaluated_regexes': {'(?:25[0-5]|2[0-4]\\d|[01]\\d{2}|\\d{1,2})(?:.(?:25[0-5]|2[0-4]\\d|[01]\\d{2}|\\d{1,2})){3}': 0.7810115257091732, '-?\\d+': 1.0, '-?\\d+(?:\\.\\d*)?': 1.0, '<\\/?(?:p|a|b|img)(?: \\/)?>': 0.0, '[A-Za-z0-9\\.,;:!?()\\"\'%\\-]+': 1.0, '\\b[0-9a-fA-F]{8}\\b-[0-9a-fA-F]{4}-[0-5][0-9a-fA-F]{3}-[089ab][0-9a-fA-F]{3}-\\b[0-9a-fA-F]{12}\\b ': 0.0, '\\d+': 1.0, '\\s+$': 0.0, '^\\s+': 0.0, 'https?:\\/\\/(?:www\\.)?[-a-zA-Z0-9@:%._\\+~#=]{2,255}\\.[a-z]{2,6}\\b(?:[-a-zA-Z0-9@:%_\\+.~#()?&//=]*)': 0.0}, 'success_ratio': 1.0}})

  validator.expect_column_values_to_match_regex(column='id', mostly=1.0, regex='-?\d+', meta={'profiler_details': {'evaluated_regexes': {'(?:25[0-5]|2[0-4]\\d|[01]\\d{2}|\\d{1,2})(?:.(?:25[0-5]|2[0-4]\\d|[01]\\d{2}|\\d{1,2})){3}': 0.7810115257091732, '-?\\d+': 1.0, '-?\\d+(?:\\.\\d*)?': 1.0, '<\\/?(?:p|a|b|img)(?: \\/)?>': 0.0, '[A-Za-z0-9\\.,;:!?()\\"\'%\\-]+': 1.0, '\\b[0-9a-fA-F]{8}\\b-[0-9a-fA-F]{4}-[0-5][0-9a-fA-F]{3}-[089ab][0-9a-fA-F]{3}-\\b[0-9a-fA-F]{12}\\b ': 0.0, '\\d+': 1.0, '\\s+$': 0.0, '^\\s+': 0.0, 'https?:\\/\\/(?:www\\.)?[-a-zA-Z0-9@:%._\\+~#=]{2,255}\\.[a-z]{2,6}\\b(?:[-a-zA-Z0-9@:%_\\+.~#()?&//=]*)': 0.0}, 'success_ratio': 1.0}})


Calculating Metrics:   0%|          | 0/8 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "element_count": 76004,
    "unexpected_count": 0,
    "unexpected_percent": 0.0,
    "partial_unexpected_list": [],
    "missing_count": 0,
    "missing_percent": 0.0,
    "unexpected_percent_total": 0.0,
    "unexpected_percent_nonmissing": 0.0
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [101]:
validator.expect_column_values_to_be_unique(column='id', meta={'profiler_details': {'metric_configuration': {'domain_kwargs': {'column': 'id'}, 'metric_dependencies': None, 'metric_name': 'column_values.unique', 'metric_value_kwargs': None}, 'num_batches': 2}})

Calculating Metrics:   0%|          | 0/8 [00:00<?, ?it/s]

{
  "success": false,
  "result": {
    "element_count": 76004,
    "unexpected_count": 70352,
    "unexpected_percent": 92.56354928687965,
    "partial_unexpected_list": [
      "R18032505027684",
      "R18032505027677",
      "R18032505027721",
      "R18032516508249",
      "R18032516507621",
      "R18032516508005",
      "R18032516508688",
      "R18032516507720",
      "R18032516507955",
      "R18032810357425",
      "R18032810357459",
      "R18032810357525",
      "R18032810357497",
      "R18032216107876",
      "R18032216107750",
      "R18032216107338",
      "R18032216107425",
      "R18032216107405",
      "R18032216107389",
      "R18032216107419"
    ],
    "missing_count": 0,
    "missing_percent": 0.0,
    "unexpected_percent_total": 92.56354928687965,
    "unexpected_percent_nonmissing": 92.56354928687965
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

#### `file_name`

In [102]:

validator.expect_column_values_to_not_be_null(column='file_name', meta={'profiler_details': {'metric_configuration': {'domain_kwargs': {'column': 'file_name'}, 'metric_dependencies': None, 'metric_name': 'column_values.nonnull.unexpected_count', 'metric_value_kwargs': None}, 'num_batches': 1}})

Calculating Metrics:   0%|          | 0/6 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "element_count": 76004,
    "unexpected_count": 0,
    "unexpected_percent": 0.0,
    "partial_unexpected_list": []
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [103]:

validator.expect_column_value_lengths_to_be_between(column='file_name', max_value=53, min_value=48, mostly=1.0, strict_max=False, strict_min=False, meta={'profiler_details': {'column_max_length_range_estimator': {'metric_configuration': {'domain_kwargs': {'column': 'file_name'}, 'metric_dependencies': None, 'metric_name': 'column_values.length.max', 'metric_value_kwargs': None}, 'num_batches': 1}, 'column_min_length_range_estimator': {'metric_configuration': {'domain_kwargs': {'column': 'file_name'}, 'metric_dependencies': None, 'metric_name': 'column_values.length.min', 'metric_value_kwargs': None}, 'num_batches': 1}}})

Calculating Metrics:   0%|          | 0/9 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "element_count": 76004,
    "unexpected_count": 0,
    "unexpected_percent": 0.0,
    "partial_unexpected_list": [],
    "missing_count": 0,
    "missing_percent": 0.0,
    "unexpected_percent_total": 0.0,
    "unexpected_percent_nonmissing": 0.0
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [104]:

validator.expect_column_values_to_match_regex(column='file_name', mostly=1.0, regex='(?:25[0-5]|2[0-4]\d|[01]\d{2}|\d{1,2})(?:.(?:25[0-5]|2[0-4]\d|[01]\d{2}|\d{1,2})){3}', meta={'profiler_details': {'evaluated_regexes': {'(?:25[0-5]|2[0-4]\\d|[01]\\d{2}|\\d{1,2})(?:.(?:25[0-5]|2[0-4]\\d|[01]\\d{2}|\\d{1,2})){3}': 1.0, '-?\\d+': 1.0, '-?\\d+(?:\\.\\d*)?': 1.0, '<\\/?(?:p|a|b|img)(?: \\/)?>': 0.0, '[A-Za-z0-9\\.,;:!?()\\"\'%\\-]+': 1.0, '\\b[0-9a-fA-F]{8}\\b-[0-9a-fA-F]{4}-[0-5][0-9a-fA-F]{3}-[089ab][0-9a-fA-F]{3}-\\b[0-9a-fA-F]{12}\\b ': 0.0, '\\d+': 1.0, '\\s+$': 0.0, '^\\s+': 0.0, 'https?:\\/\\/(?:www\\.)?[-a-zA-Z0-9@:%._\\+~#=]{2,255}\\.[a-z]{2,6}\\b(?:[-a-zA-Z0-9@:%_\\+.~#()?&//=]*)': 0.0}, 'success_ratio': 1.0}})

  validator.expect_column_values_to_match_regex(column='file_name', mostly=1.0, regex='(?:25[0-5]|2[0-4]\d|[01]\d{2}|\d{1,2})(?:.(?:25[0-5]|2[0-4]\d|[01]\d{2}|\d{1,2})){3}', meta={'profiler_details': {'evaluated_regexes': {'(?:25[0-5]|2[0-4]\\d|[01]\\d{2}|\\d{1,2})(?:.(?:25[0-5]|2[0-4]\\d|[01]\\d{2}|\\d{1,2})){3}': 1.0, '-?\\d+': 1.0, '-?\\d+(?:\\.\\d*)?': 1.0, '<\\/?(?:p|a|b|img)(?: \\/)?>': 0.0, '[A-Za-z0-9\\.,;:!?()\\"\'%\\-]+': 1.0, '\\b[0-9a-fA-F]{8}\\b-[0-9a-fA-F]{4}-[0-5][0-9a-fA-F]{3}-[089ab][0-9a-fA-F]{3}-\\b[0-9a-fA-F]{12}\\b ': 0.0, '\\d+': 1.0, '\\s+$': 0.0, '^\\s+': 0.0, 'https?:\\/\\/(?:www\\.)?[-a-zA-Z0-9@:%._\\+~#=]{2,255}\\.[a-z]{2,6}\\b(?:[-a-zA-Z0-9@:%_\\+.~#()?&//=]*)': 0.0}, 'success_ratio': 1.0}})


Calculating Metrics:   0%|          | 0/8 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "element_count": 76004,
    "unexpected_count": 0,
    "unexpected_percent": 0.0,
    "partial_unexpected_list": [],
    "missing_count": 0,
    "missing_percent": 0.0,
    "unexpected_percent_total": 0.0,
    "unexpected_percent_nonmissing": 0.0
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

#### `file_index`

In [105]:

validator.expect_column_values_to_not_be_null(column='file_index', meta={'profiler_details': {'metric_configuration': {'domain_kwargs': {'column': 'file_index'}, 'metric_dependencies': None, 'metric_name': 'column_values.nonnull.unexpected_count', 'metric_value_kwargs': None}, 'num_batches': 1}})

Calculating Metrics:   0%|          | 0/6 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "element_count": 76004,
    "unexpected_count": 0,
    "unexpected_percent": 0.0,
    "partial_unexpected_list": []
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [106]:

validator.expect_column_min_to_be_between(column='file_index', max_value=0, min_value=0, strict_max=False, strict_min=False, meta={'profiler_details': {'metric_configuration': {'domain_kwargs': {'column': 'file_index'}, 'metric_dependencies': None, 'metric_name': 'column.min', 'metric_value_kwargs': None}, 'num_batches': 1}})

Calculating Metrics:   0%|          | 0/4 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "observed_value": 0
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [107]:

validator.expect_column_max_to_be_between(column='file_index', max_value=2367, min_value=2367, strict_max=False, strict_min=False, meta={'profiler_details': {'metric_configuration': {'domain_kwargs': {'column': 'file_index'}, 'metric_dependencies': None, 'metric_name': 'column.max', 'metric_value_kwargs': None}, 'num_batches': 1}})

Calculating Metrics:   0%|          | 0/4 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "observed_value": 2367
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [108]:

validator.expect_column_values_to_be_between(column='file_index', max_value=2367, min_value=0, mostly=1.0, strict_max=False, strict_min=False, meta={'profiler_details': {'column_max_values_range_estimator': {'metric_configuration': {'domain_kwargs': {'column': 'file_index'}, 'metric_dependencies': None, 'metric_name': 'column.max', 'metric_value_kwargs': None}, 'num_batches': 1}, 'column_min_values_range_estimator': {'metric_configuration': {'domain_kwargs': {'column': 'file_index'}, 'metric_dependencies': None, 'metric_name': 'column.min', 'metric_value_kwargs': None}, 'num_batches': 1}}})

Calculating Metrics:   0%|          | 0/8 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "element_count": 76004,
    "unexpected_count": 0,
    "unexpected_percent": 0.0,
    "partial_unexpected_list": [],
    "missing_count": 0,
    "missing_percent": 0.0,
    "unexpected_percent_total": 0.0,
    "unexpected_percent_nonmissing": 0.0
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [109]:

validator.expect_column_quantile_values_to_be_between(column='file_index', allow_relative_error=False, quantile_ranges={'quantiles': [0.25, 0.5, 0.75], 'value_ranges': [[34, 34], [288, 288], [953, 953]]}, meta={'profiler_details': {'metric_configuration': {'domain_kwargs': {'column': 'file_index'}, 'metric_dependencies': None, 'metric_name': 'column.quantile_values', 'metric_value_kwargs': {'allow_relative_error': False, 'quantiles': [0.25, 0.5, 0.75]}}, 'num_batches': 1}})

Calculating Metrics:   0%|          | 0/4 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "observed_value": {
      "quantiles": [
        0.25,
        0.5,
        0.75
      ],
      "values": [
        34,
        288,
        953
      ]
    },
    "details": {
      "success_details": [
        true,
        true,
        true
      ]
    }
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [110]:

validator.expect_column_median_to_be_between(column='file_index', max_value=288.0, min_value=288.0, strict_max=False, strict_min=False, meta={'profiler_details': {'metric_configuration': {'domain_kwargs': {'column': 'file_index'}, 'metric_dependencies': None, 'metric_name': 'column.median', 'metric_value_kwargs': None}, 'num_batches': 1}})

Calculating Metrics:   0%|          | 0/4 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "observed_value": 288.0
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [111]:

validator.expect_column_mean_to_be_between(column='file_index', max_value=560.197529077417, min_value=560.197529077417, strict_max=False, strict_min=False, meta={'profiler_details': {'metric_configuration': {'domain_kwargs': {'column': 'file_index'}, 'metric_dependencies': None, 'metric_name': 'column.mean', 'metric_value_kwargs': None}, 'num_batches': 1}})

  and should_run_async(code)


Calculating Metrics:   0%|          | 0/4 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "observed_value": 560.197529077417
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [112]:

validator.expect_column_stdev_to_be_between(column='file_index', max_value=623.8829221285116, min_value=623.8829221285116, strict_max=False, strict_min=False, meta={'profiler_details': {'metric_configuration': {'domain_kwargs': {'column': 'file_index'}, 'metric_dependencies': None, 'metric_name': 'column.standard_deviation', 'metric_value_kwargs': None}, 'num_batches': 1}})

Calculating Metrics:   0%|          | 0/4 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "observed_value": 623.8829221285116
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

#### `img_type`

In [113]:

validator.expect_column_values_to_not_be_null(column='img_type', meta={'profiler_details': {'metric_configuration': {'domain_kwargs': {'column': 'img_type'}, 'metric_dependencies': None, 'metric_name': 'column_values.nonnull.unexpected_count', 'metric_value_kwargs': None}, 'num_batches': 1}})

Calculating Metrics:   0%|          | 0/6 [00:00<?, ?it/s]

  return list(domain_values[: result_format["partial_unexpected_count"]])


{
  "success": true,
  "result": {
    "element_count": 76004,
    "unexpected_count": 0,
    "unexpected_percent": 0.0,
    "partial_unexpected_list": []
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [114]:

validator.expect_column_value_lengths_to_be_between(column='img_type', max_value=5, min_value=3, mostly=1.0, strict_max=False, strict_min=False, meta={'profiler_details': {'column_max_length_range_estimator': {'metric_configuration': {'domain_kwargs': {'column': 'img_type'}, 'metric_dependencies': None, 'metric_name': 'column_values.length.max', 'metric_value_kwargs': None}, 'num_batches': 1}, 'column_min_length_range_estimator': {'metric_configuration': {'domain_kwargs': {'column': 'img_type'}, 'metric_dependencies': None, 'metric_name': 'column_values.length.min', 'metric_value_kwargs': None}, 'num_batches': 1}}})

Calculating Metrics:   0%|          | 0/9 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "element_count": 76004,
    "unexpected_count": 0,
    "unexpected_percent": 0.0,
    "partial_unexpected_list": [],
    "missing_count": 0,
    "missing_percent": 0.0,
    "unexpected_percent_total": 0.0,
    "unexpected_percent_nonmissing": 0.0
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [115]:

validator.expect_column_values_to_match_regex(column='img_type', mostly=1.0, regex='[A-Za-z0-9\.,;:!?()\"'%\-]+', meta={'profiler_details': {'evaluated_regexes': {'(?:25[0-5]|2[0-4]\\d|[01]\\d{2}|\\d{1,2})(?:.(?:25[0-5]|2[0-4]\\d|[01]\\d{2}|\\d{1,2})){3}': 0.0, '-?\\d+': 0.3564680806273354, '-?\\d+(?:\\.\\d*)?': 0.3564680806273354, '<\\/?(?:p|a|b|img)(?: \\/)?>': 0.0, '[A-Za-z0-9\\.,;:!?()\\"\'%\\-]+': 1.0, '\\b[0-9a-fA-F]{8}\\b-[0-9a-fA-F]{4}-[0-5][0-9a-fA-F]{3}-[089ab][0-9a-fA-F]{3}-\\b[0-9a-fA-F]{12}\\b ': 0.0, '\\d+': 0.3564680806273354, '\\s+$': 0.0, '^\\s+': 0.0, 'https?:\\/\\/(?:www\\.)?[-a-zA-Z0-9@:%._\\+~#=]{2,255}\\.[a-z]{2,6}\\b(?:[-a-zA-Z0-9@:%_\\+.~#()?&//=]*)': 0.0}, 'success_ratio': 1.0}})

  validator.expect_column_values_to_match_regex(column='img_type', mostly=1.0, regex='[A-Za-z0-9\.,;:!?()\"'%\-]+', meta={'profiler_details': {'evaluated_regexes': {'(?:25[0-5]|2[0-4]\\d|[01]\\d{2}|\\d{1,2})(?:.(?:25[0-5]|2[0-4]\\d|[01]\\d{2}|\\d{1,2})){3}': 0.0, '-?\\d+': 0.3564680806273354, '-?\\d+(?:\\.\\d*)?': 0.3564680806273354, '<\\/?(?:p|a|b|img)(?: \\/)?>': 0.0, '[A-Za-z0-9\\.,;:!?()\\"\'%\\-]+': 1.0, '\\b[0-9a-fA-F]{8}\\b-[0-9a-fA-F]{4}-[0-5][0-9a-fA-F]{3}-[089ab][0-9a-fA-F]{3}-\\b[0-9a-fA-F]{12}\\b ': 0.0, '\\d+': 0.3564680806273354, '\\s+$': 0.0, '^\\s+': 0.0, 'https?:\\/\\/(?:www\\.)?[-a-zA-Z0-9@:%._\\+~#=]{2,255}\\.[a-z]{2,6}\\b(?:[-a-zA-Z0-9@:%_\\+.~#()?&//=]*)': 0.0}, 'success_ratio': 1.0}})


SyntaxError: unexpected character after line continuation character (<ipython-input-115-f761df33b842>, line 1)

In [117]:

validator.expect_column_values_to_be_in_set(column='img_type', mostly=1.0, value_set=['ir107', 'vil', 'lght', 'vis', 'ir069'], meta={'profiler_details': {'metric_configuration': {'domain_kwargs': {'column': 'img_type'}, 'metric_dependencies': None, 'metric_name': 'column.distinct_values', 'metric_value_kwargs': None}, 'num_batches': 1, 'parse_strings_as_datetimes': False}})

Calculating Metrics:   0%|          | 0/8 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "element_count": 76004,
    "unexpected_count": 0,
    "unexpected_percent": 0.0,
    "partial_unexpected_list": [],
    "missing_count": 0,
    "missing_percent": 0.0,
    "unexpected_percent_total": 0.0,
    "unexpected_percent_nonmissing": 0.0
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [118]:

validator.expect_column_unique_value_count_to_be_between(column='img_type', max_value=5, min_value=5, strict_max=False, strict_min=False, meta={'profiler_details': {'metric_configuration': {'domain_kwargs': {'column': 'img_type'}, 'metric_dependencies': None, 'metric_name': 'column.distinct_values.count', 'metric_value_kwargs': None}, 'num_batches': 1}})

Calculating Metrics:   0%|          | 0/4 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "observed_value": 5
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [119]:

validator.expect_column_proportion_of_unique_values_to_be_between(column='img_type', max_value=6.578601126256512e-05, min_value=6.578601126256512e-05, strict_max=False, strict_min=False, meta={'profiler_details': {'metric_configuration': {'domain_kwargs': {'column': 'img_type'}, 'metric_dependencies': None, 'metric_name': 'column.unique_proportion', 'metric_value_kwargs': None}, 'num_batches': 1}})

Calculating Metrics:   0%|          | 0/7 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "observed_value": 6.578601126256512e-05
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

#### `time_utc`

In [120]:

validator.expect_column_values_to_not_be_null(column='time_utc', meta={'profiler_details': {'metric_configuration': {'domain_kwargs': {'column': 'time_utc'}, 'metric_dependencies': None, 'metric_name': 'column_values.nonnull.unexpected_count', 'metric_value_kwargs': None}, 'num_batches': 1}})

Calculating Metrics:   0%|          | 0/6 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "element_count": 76004,
    "unexpected_count": 0,
    "unexpected_percent": 0.0,
    "partial_unexpected_list": []
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [121]:

validator.expect_column_value_lengths_to_be_between(column='time_utc', max_value=19, min_value=19, mostly=1.0, strict_max=False, strict_min=False, meta={'profiler_details': {'column_max_length_range_estimator': {'metric_configuration': {'domain_kwargs': {'column': 'time_utc'}, 'metric_dependencies': None, 'metric_name': 'column_values.length.max', 'metric_value_kwargs': None}, 'num_batches': 1}, 'column_min_length_range_estimator': {'metric_configuration': {'domain_kwargs': {'column': 'time_utc'}, 'metric_dependencies': None, 'metric_name': 'column_values.length.min', 'metric_value_kwargs': None}, 'num_batches': 1}}})

Calculating Metrics:   0%|          | 0/9 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "element_count": 76004,
    "unexpected_count": 0,
    "unexpected_percent": 0.0,
    "partial_unexpected_list": [],
    "missing_count": 0,
    "missing_percent": 0.0,
    "unexpected_percent_total": 0.0,
    "unexpected_percent_nonmissing": 0.0
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [122]:

validator.expect_column_values_to_match_regex(column='time_utc', mostly=1.0, regex='(?:25[0-5]|2[0-4]\d|[01]\d{2}|\d{1,2})(?:.(?:25[0-5]|2[0-4]\d|[01]\d{2}|\d{1,2})){3}', meta={'profiler_details': {'evaluated_regexes': {'(?:25[0-5]|2[0-4]\\d|[01]\\d{2}|\\d{1,2})(?:.(?:25[0-5]|2[0-4]\\d|[01]\\d{2}|\\d{1,2})){3}': 1.0, '-?\\d+': 1.0, '-?\\d+(?:\\.\\d*)?': 1.0, '<\\/?(?:p|a|b|img)(?: \\/)?>': 0.0, '[A-Za-z0-9\\.,;:!?()\\"\'%\\-]+': 1.0, '\\b[0-9a-fA-F]{8}\\b-[0-9a-fA-F]{4}-[0-5][0-9a-fA-F]{3}-[089ab][0-9a-fA-F]{3}-\\b[0-9a-fA-F]{12}\\b ': 0.0, '\\d+': 1.0, '\\s+$': 0.0, '^\\s+': 0.0, 'https?:\\/\\/(?:www\\.)?[-a-zA-Z0-9@:%._\\+~#=]{2,255}\\.[a-z]{2,6}\\b(?:[-a-zA-Z0-9@:%_\\+.~#()?&//=]*)': 0.0}, 'success_ratio': 1.0}})

  validator.expect_column_values_to_match_regex(column='time_utc', mostly=1.0, regex='(?:25[0-5]|2[0-4]\d|[01]\d{2}|\d{1,2})(?:.(?:25[0-5]|2[0-4]\d|[01]\d{2}|\d{1,2})){3}', meta={'profiler_details': {'evaluated_regexes': {'(?:25[0-5]|2[0-4]\\d|[01]\\d{2}|\\d{1,2})(?:.(?:25[0-5]|2[0-4]\\d|[01]\\d{2}|\\d{1,2})){3}': 1.0, '-?\\d+': 1.0, '-?\\d+(?:\\.\\d*)?': 1.0, '<\\/?(?:p|a|b|img)(?: \\/)?>': 0.0, '[A-Za-z0-9\\.,;:!?()\\"\'%\\-]+': 1.0, '\\b[0-9a-fA-F]{8}\\b-[0-9a-fA-F]{4}-[0-5][0-9a-fA-F]{3}-[089ab][0-9a-fA-F]{3}-\\b[0-9a-fA-F]{12}\\b ': 0.0, '\\d+': 1.0, '\\s+$': 0.0, '^\\s+': 0.0, 'https?:\\/\\/(?:www\\.)?[-a-zA-Z0-9@:%._\\+~#=]{2,255}\\.[a-z]{2,6}\\b(?:[-a-zA-Z0-9@:%_\\+.~#()?&//=]*)': 0.0}, 'success_ratio': 1.0}})


Calculating Metrics:   0%|          | 0/8 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "element_count": 76004,
    "unexpected_count": 0,
    "unexpected_percent": 0.0,
    "partial_unexpected_list": [],
    "missing_count": 0,
    "missing_percent": 0.0,
    "unexpected_percent_total": 0.0,
    "unexpected_percent_nonmissing": 0.0
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

#### `llcrnrlat`

In [123]:

validator.expect_column_values_to_not_be_null(column='llcrnrlat', meta={'profiler_details': {'metric_configuration': {'domain_kwargs': {'column': 'llcrnrlat'}, 'metric_dependencies': None, 'metric_name': 'column_values.nonnull.unexpected_count', 'metric_value_kwargs': None}, 'num_batches': 1}})

Calculating Metrics:   0%|          | 0/6 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "element_count": 76004,
    "unexpected_count": 0,
    "unexpected_percent": 0.0,
    "partial_unexpected_list": []
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [124]:

validator.expect_column_min_to_be_between(column='llcrnrlat', max_value=22.037719406438192, min_value=22.037719406438192, strict_max=False, strict_min=False, meta={'profiler_details': {'metric_configuration': {'domain_kwargs': {'column': 'llcrnrlat'}, 'metric_dependencies': None, 'metric_name': 'column.min', 'metric_value_kwargs': None}, 'num_batches': 1}})

Calculating Metrics:   0%|          | 0/4 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "observed_value": 22.037719406438192
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [125]:

validator.expect_column_max_to_be_between(column='llcrnrlat', max_value=47.6451952545839, min_value=47.6451952545839, strict_max=False, strict_min=False, meta={'profiler_details': {'metric_configuration': {'domain_kwargs': {'column': 'llcrnrlat'}, 'metric_dependencies': None, 'metric_name': 'column.max', 'metric_value_kwargs': None}, 'num_batches': 1}})

Calculating Metrics:   0%|          | 0/4 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "observed_value": 47.6451952545839
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [126]:

validator.expect_column_values_to_be_between(column='llcrnrlat', max_value=47.6451952545839, min_value=22.037719406438192, mostly=1.0, strict_max=False, strict_min=False, meta={'profiler_details': {'column_max_values_range_estimator': {'metric_configuration': {'domain_kwargs': {'column': 'llcrnrlat'}, 'metric_dependencies': None, 'metric_name': 'column.max', 'metric_value_kwargs': None}, 'num_batches': 1}, 'column_min_values_range_estimator': {'metric_configuration': {'domain_kwargs': {'column': 'llcrnrlat'}, 'metric_dependencies': None, 'metric_name': 'column.min', 'metric_value_kwargs': None}, 'num_batches': 1}}})

Calculating Metrics:   0%|          | 0/8 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "element_count": 76004,
    "unexpected_count": 0,
    "unexpected_percent": 0.0,
    "partial_unexpected_list": [],
    "missing_count": 0,
    "missing_percent": 0.0,
    "unexpected_percent_total": 0.0,
    "unexpected_percent_nonmissing": 0.0
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [127]:

validator.expect_column_quantile_values_to_be_between(column='llcrnrlat', allow_relative_error=False, quantile_ranges={'quantiles': [0.25, 0.5, 0.75], 'value_ranges': [[31.504089053000357, 31.504089053000357], [35.90351723295371, 35.90351723295371], [40.25077938682679, 40.25077938682679]]}, meta={'profiler_details': {'metric_configuration': {'domain_kwargs': {'column': 'llcrnrlat'}, 'metric_dependencies': None, 'metric_name': 'column.quantile_values', 'metric_value_kwargs': {'allow_relative_error': False, 'quantiles': [0.25, 0.5, 0.75]}}, 'num_batches': 1}})

Calculating Metrics:   0%|          | 0/4 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "observed_value": {
      "quantiles": [
        0.25,
        0.5,
        0.75
      ],
      "values": [
        31.504089053000357,
        35.90351723295371,
        40.25077938682679
      ]
    },
    "details": {
      "success_details": [
        true,
        true,
        true
      ]
    }
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [128]:

validator.expect_column_median_to_be_between(column='llcrnrlat', max_value=35.90351723295371, min_value=35.90351723295371, strict_max=False, strict_min=False, meta={'profiler_details': {'metric_configuration': {'domain_kwargs': {'column': 'llcrnrlat'}, 'metric_dependencies': None, 'metric_name': 'column.median', 'metric_value_kwargs': None}, 'num_batches': 1}})

Calculating Metrics:   0%|          | 0/4 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "observed_value": 35.90351723295371
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [129]:

validator.expect_column_mean_to_be_between(column='llcrnrlat', max_value=35.88721299948105, min_value=35.88721299948105, strict_max=False, strict_min=False, meta={'profiler_details': {'metric_configuration': {'domain_kwargs': {'column': 'llcrnrlat'}, 'metric_dependencies': None, 'metric_name': 'column.mean', 'metric_value_kwargs': None}, 'num_batches': 1}})

  and should_run_async(code)


Calculating Metrics:   0%|          | 0/4 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "observed_value": 35.88721299948105
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [130]:

validator.expect_column_stdev_to_be_between(column='llcrnrlat', max_value=5.594122687133442, min_value=5.594122687133442, strict_max=False, strict_min=False, meta={'profiler_details': {'metric_configuration': {'domain_kwargs': {'column': 'llcrnrlat'}, 'metric_dependencies': None, 'metric_name': 'column.standard_deviation', 'metric_value_kwargs': None}, 'num_batches': 1}})

Calculating Metrics:   0%|          | 0/4 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "observed_value": 5.594122687133442
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

#### `llcrnrlon`

In [131]:

validator.expect_column_values_to_not_be_null(column='llcrnrlon', meta={'profiler_details': {'metric_configuration': {'domain_kwargs': {'column': 'llcrnrlon'}, 'metric_dependencies': None, 'metric_name': 'column_values.nonnull.unexpected_count', 'metric_value_kwargs': None}, 'num_batches': 1}})

Calculating Metrics:   0%|          | 0/6 [00:00<?, ?it/s]

  return list(domain_values[: result_format["partial_unexpected_count"]])


{
  "success": true,
  "result": {
    "element_count": 76004,
    "unexpected_count": 0,
    "unexpected_percent": 0.0,
    "partial_unexpected_list": []
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [132]:

validator.expect_column_min_to_be_between(column='llcrnrlon', max_value=-127.23602309043991, min_value=-127.23602309043991, strict_max=False, strict_min=False, meta={'profiler_details': {'metric_configuration': {'domain_kwargs': {'column': 'llcrnrlon'}, 'metric_dependencies': None, 'metric_name': 'column.min', 'metric_value_kwargs': None}, 'num_batches': 1}})

Calculating Metrics:   0%|          | 0/4 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "observed_value": -127.23602309043991
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [133]:

validator.expect_column_max_to_be_between(column='llcrnrlon', max_value=-69.59615266178442, min_value=-69.59615266178442, strict_max=False, strict_min=False, meta={'profiler_details': {'metric_configuration': {'domain_kwargs': {'column': 'llcrnrlon'}, 'metric_dependencies': None, 'metric_name': 'column.max', 'metric_value_kwargs': None}, 'num_batches': 1}})

Calculating Metrics:   0%|          | 0/4 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "observed_value": -69.59615266178442
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [134]:

validator.expect_column_values_to_be_between(column='llcrnrlon', max_value=-69.59615266178442, min_value=-127.23602309043991, mostly=1.0, strict_max=False, strict_min=False, meta={'profiler_details': {'column_max_values_range_estimator': {'metric_configuration': {'domain_kwargs': {'column': 'llcrnrlon'}, 'metric_dependencies': None, 'metric_name': 'column.max', 'metric_value_kwargs': None}, 'num_batches': 1}, 'column_min_values_range_estimator': {'metric_configuration': {'domain_kwargs': {'column': 'llcrnrlon'}, 'metric_dependencies': None, 'metric_name': 'column.min', 'metric_value_kwargs': None}, 'num_batches': 1}}})

Calculating Metrics:   0%|          | 0/8 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "element_count": 76004,
    "unexpected_count": 0,
    "unexpected_percent": 0.0,
    "partial_unexpected_list": [],
    "missing_count": 0,
    "missing_percent": 0.0,
    "unexpected_percent_total": 0.0,
    "unexpected_percent_nonmissing": 0.0
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [135]:

validator.expect_column_quantile_values_to_be_between(column='llcrnrlon', allow_relative_error=False, quantile_ranges={'quantiles': [0.25, 0.5, 0.75], 'value_ranges': [[-101.95866854645936, -101.95866854645936], [-93.61010329974404, -93.61010329974404], [-85.50213715244381, -85.50213715244381]]}, meta={'profiler_details': {'metric_configuration': {'domain_kwargs': {'column': 'llcrnrlon'}, 'metric_dependencies': None, 'metric_name': 'column.quantile_values', 'metric_value_kwargs': {'allow_relative_error': False, 'quantiles': [0.25, 0.5, 0.75]}}, 'num_batches': 1}})

Calculating Metrics:   0%|          | 0/4 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "observed_value": {
      "quantiles": [
        0.25,
        0.5,
        0.75
      ],
      "values": [
        -101.95866854645936,
        -93.61010329974404,
        -85.50213715244381
      ]
    },
    "details": {
      "success_details": [
        true,
        true,
        true
      ]
    }
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [136]:

validator.expect_column_median_to_be_between(column='llcrnrlon', max_value=-93.61010329974404, min_value=-93.61010329974404, strict_max=False, strict_min=False, meta={'profiler_details': {'metric_configuration': {'domain_kwargs': {'column': 'llcrnrlon'}, 'metric_dependencies': None, 'metric_name': 'column.median', 'metric_value_kwargs': None}, 'num_batches': 1}})

Calculating Metrics:   0%|          | 0/4 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "observed_value": -93.61010329974404
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [137]:

validator.expect_column_mean_to_be_between(column='llcrnrlon', max_value=-95.09555553043528, min_value=-95.09555553043528, strict_max=False, strict_min=False, meta={'profiler_details': {'metric_configuration': {'domain_kwargs': {'column': 'llcrnrlon'}, 'metric_dependencies': None, 'metric_name': 'column.mean', 'metric_value_kwargs': None}, 'num_batches': 1}})

  and should_run_async(code)


Calculating Metrics:   0%|          | 0/4 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "observed_value": -95.09555553043528
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [138]:

validator.expect_column_stdev_to_be_between(column='llcrnrlon', max_value=12.521708865404335, min_value=12.521708865404335, strict_max=False, strict_min=False, meta={'profiler_details': {'metric_configuration': {'domain_kwargs': {'column': 'llcrnrlon'}, 'metric_dependencies': None, 'metric_name': 'column.standard_deviation', 'metric_value_kwargs': None}, 'num_batches': 1}})

Calculating Metrics:   0%|          | 0/4 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "observed_value": 12.521708865404335
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

#### `urcrnrlat`

In [139]:

validator.expect_column_values_to_not_be_null(column='urcrnrlat', meta={'profiler_details': {'metric_configuration': {'domain_kwargs': {'column': 'urcrnrlat'}, 'metric_dependencies': None, 'metric_name': 'column_values.nonnull.unexpected_count', 'metric_value_kwargs': None}, 'num_batches': 1}})

Calculating Metrics:   0%|          | 0/6 [00:00<?, ?it/s]

  return list(domain_values[: result_format["partial_unexpected_count"]])


{
  "success": true,
  "result": {
    "element_count": 76004,
    "unexpected_count": 0,
    "unexpected_percent": 0.0,
    "partial_unexpected_list": []
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [140]:

validator.expect_column_min_to_be_between(column='urcrnrlat', max_value=24.88471165440152, min_value=24.88471165440152, strict_max=False, strict_min=False, meta={'profiler_details': {'metric_configuration': {'domain_kwargs': {'column': 'urcrnrlat'}, 'metric_dependencies': None, 'metric_name': 'column.min', 'metric_value_kwargs': None}, 'num_batches': 1}})

Calculating Metrics:   0%|          | 0/4 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "observed_value": 24.88471165440152
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [141]:

validator.expect_column_max_to_be_between(column='urcrnrlat', max_value=51.89677240465032, min_value=51.89677240465032, strict_max=False, strict_min=False, meta={'profiler_details': {'metric_configuration': {'domain_kwargs': {'column': 'urcrnrlat'}, 'metric_dependencies': None, 'metric_name': 'column.max', 'metric_value_kwargs': None}, 'num_batches': 1}})

Calculating Metrics:   0%|          | 0/4 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "observed_value": 51.89677240465032
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [142]:

validator.expect_column_values_to_be_between(column='urcrnrlat', max_value=51.89677240465032, min_value=24.88471165440152, mostly=1.0, strict_max=False, strict_min=False, meta={'profiler_details': {'column_max_values_range_estimator': {'metric_configuration': {'domain_kwargs': {'column': 'urcrnrlat'}, 'metric_dependencies': None, 'metric_name': 'column.max', 'metric_value_kwargs': None}, 'num_batches': 1}, 'column_min_values_range_estimator': {'metric_configuration': {'domain_kwargs': {'column': 'urcrnrlat'}, 'metric_dependencies': None, 'metric_name': 'column.min', 'metric_value_kwargs': None}, 'num_batches': 1}}})

Calculating Metrics:   0%|          | 0/8 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "element_count": 76004,
    "unexpected_count": 0,
    "unexpected_percent": 0.0,
    "partial_unexpected_list": [],
    "missing_count": 0,
    "missing_percent": 0.0,
    "unexpected_percent_total": 0.0,
    "unexpected_percent_nonmissing": 0.0
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [143]:

validator.expect_column_quantile_values_to_be_between(column='urcrnrlat', allow_relative_error=False, quantile_ranges={'quantiles': [0.25, 0.5, 0.75], 'value_ranges': [[34.78448218289119, 34.78448218289119], [39.16108782439054, 39.16108782439054], [43.301251558311776, 43.301251558311776]]}, meta={'profiler_details': {'metric_configuration': {'domain_kwargs': {'column': 'urcrnrlat'}, 'metric_dependencies': None, 'metric_name': 'column.quantile_values', 'metric_value_kwargs': {'allow_relative_error': False, 'quantiles': [0.25, 0.5, 0.75]}}, 'num_batches': 1}})

Calculating Metrics:   0%|          | 0/4 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "observed_value": {
      "quantiles": [
        0.25,
        0.5,
        0.75
      ],
      "values": [
        34.78448218289119,
        39.16108782439054,
        43.301251558311776
      ]
    },
    "details": {
      "success_details": [
        true,
        true,
        true
      ]
    }
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [144]:

validator.expect_column_median_to_be_between(column='urcrnrlat', max_value=39.16108782439054, min_value=39.16108782439054, strict_max=False, strict_min=False, meta={'profiler_details': {'metric_configuration': {'domain_kwargs': {'column': 'urcrnrlat'}, 'metric_dependencies': None, 'metric_name': 'column.median', 'metric_value_kwargs': None}, 'num_batches': 1}})

Calculating Metrics:   0%|          | 0/4 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "observed_value": 39.16108782439054
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [145]:

validator.expect_column_mean_to_be_between(column='urcrnrlat', max_value=39.10037506511802, min_value=39.10037506511802, strict_max=False, strict_min=False, meta={'profiler_details': {'metric_configuration': {'domain_kwargs': {'column': 'urcrnrlat'}, 'metric_dependencies': None, 'metric_name': 'column.mean', 'metric_value_kwargs': None}, 'num_batches': 1}})

  and should_run_async(code)


Calculating Metrics:   0%|          | 0/4 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "observed_value": 39.10037506511802
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [146]:

validator.expect_column_stdev_to_be_between(column='urcrnrlat', max_value=5.636998305059644, min_value=5.636998305059644, strict_max=False, strict_min=False, meta={'profiler_details': {'metric_configuration': {'domain_kwargs': {'column': 'urcrnrlat'}, 'metric_dependencies': None, 'metric_name': 'column.standard_deviation', 'metric_value_kwargs': None}, 'num_batches': 1}})

Calculating Metrics:   0%|          | 0/4 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "observed_value": 5.636998305059644
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

#### `urcrnrlon`

In [147]:

validator.expect_column_values_to_not_be_null(column='urcrnrlon', meta={'profiler_details': {'metric_configuration': {'domain_kwargs': {'column': 'urcrnrlon'}, 'metric_dependencies': None, 'metric_name': 'column_values.nonnull.unexpected_count', 'metric_value_kwargs': None}, 'num_batches': 1}})

Calculating Metrics:   0%|          | 0/6 [00:00<?, ?it/s]

  return list(domain_values[: result_format["partial_unexpected_count"]])


{
  "success": true,
  "result": {
    "element_count": 76004,
    "unexpected_count": 0,
    "unexpected_percent": 0.0,
    "partial_unexpected_list": []
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [148]:

validator.expect_column_min_to_be_between(column='urcrnrlon', max_value=-124.09200893291904, min_value=-124.09200893291904, strict_max=False, strict_min=False, meta={'profiler_details': {'metric_configuration': {'domain_kwargs': {'column': 'urcrnrlon'}, 'metric_dependencies': None, 'metric_name': 'column.min', 'metric_value_kwargs': None}, 'num_batches': 1}})

Calculating Metrics:   0%|          | 0/4 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "observed_value": -124.09200893291904
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [149]:

validator.expect_column_max_to_be_between(column='urcrnrlon', max_value=-62.923893868831385, min_value=-62.923893868831385, strict_max=False, strict_min=False, meta={'profiler_details': {'metric_configuration': {'domain_kwargs': {'column': 'urcrnrlon'}, 'metric_dependencies': None, 'metric_name': 'column.max', 'metric_value_kwargs': None}, 'num_batches': 1}})

Calculating Metrics:   0%|          | 0/4 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "observed_value": -62.923893868831385
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [150]:

validator.expect_column_values_to_be_between(column='urcrnrlon', max_value=-62.923893868831385, min_value=-124.09200893291904, mostly=1.0, strict_max=False, strict_min=False, meta={'profiler_details': {'column_max_values_range_estimator': {'metric_configuration': {'domain_kwargs': {'column': 'urcrnrlon'}, 'metric_dependencies': None, 'metric_name': 'column.max', 'metric_value_kwargs': None}, 'num_batches': 1}, 'column_min_values_range_estimator': {'metric_configuration': {'domain_kwargs': {'column': 'urcrnrlon'}, 'metric_dependencies': None, 'metric_name': 'column.min', 'metric_value_kwargs': None}, 'num_batches': 1}}})

Calculating Metrics:   0%|          | 0/8 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "element_count": 76004,
    "unexpected_count": 0,
    "unexpected_percent": 0.0,
    "partial_unexpected_list": [],
    "missing_count": 0,
    "missing_percent": 0.0,
    "unexpected_percent_total": 0.0,
    "unexpected_percent_nonmissing": 0.0
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [151]:

validator.expect_column_quantile_values_to_be_between(column='urcrnrlon', allow_relative_error=False, quantile_ranges={'quantiles': [0.25, 0.5, 0.75], 'value_ranges': [[-97.6054098345261, -97.6054098345261], [-88.82070045499479, -88.82070045499479], [-80.64909018058297, -80.64909018058297]]}, meta={'profiler_details': {'metric_configuration': {'domain_kwargs': {'column': 'urcrnrlon'}, 'metric_dependencies': None, 'metric_name': 'column.quantile_values', 'metric_value_kwargs': {'allow_relative_error': False, 'quantiles': [0.25, 0.5, 0.75]}}, 'num_batches': 1}})

Calculating Metrics:   0%|          | 0/4 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "observed_value": {
      "quantiles": [
        0.25,
        0.5,
        0.75
      ],
      "values": [
        -97.6054098345261,
        -88.82070045499479,
        -80.64909018058297
      ]
    },
    "details": {
      "success_details": [
        true,
        true,
        true
      ]
    }
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [152]:

validator.expect_column_median_to_be_between(column='urcrnrlon', max_value=-88.82070045499482, min_value=-88.82070045499482, strict_max=False, strict_min=False, meta={'profiler_details': {'metric_configuration': {'domain_kwargs': {'column': 'urcrnrlon'}, 'metric_dependencies': None, 'metric_name': 'column.median', 'metric_value_kwargs': None}, 'num_batches': 1}})

Calculating Metrics:   0%|          | 0/4 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "observed_value": -88.82070045499482
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [153]:

validator.expect_column_mean_to_be_between(column='urcrnrlon', max_value=-90.50152810067166, min_value=-90.50152810067166, strict_max=False, strict_min=False, meta={'profiler_details': {'metric_configuration': {'domain_kwargs': {'column': 'urcrnrlon'}, 'metric_dependencies': None, 'metric_name': 'column.mean', 'metric_value_kwargs': None}, 'num_batches': 1}})

  and should_run_async(code)


Calculating Metrics:   0%|          | 0/4 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "observed_value": -90.50152810067166
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [154]:

validator.expect_column_stdev_to_be_between(column='urcrnrlon', max_value=13.103338786082888, min_value=13.103338786082888, strict_max=False, strict_min=False, meta={'profiler_details': {'metric_configuration': {'domain_kwargs': {'column': 'urcrnrlon'}, 'metric_dependencies': None, 'metric_name': 'column.standard_deviation', 'metric_value_kwargs': None}, 'num_batches': 1}})

Calculating Metrics:   0%|          | 0/4 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "observed_value": 13.103338786082888
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

#### `pct_missing`

In [155]:

validator.expect_column_values_to_not_be_null(column='pct_missing', meta={'profiler_details': {'metric_configuration': {'domain_kwargs': {'column': 'pct_missing'}, 'metric_dependencies': None, 'metric_name': 'column_values.nonnull.unexpected_count', 'metric_value_kwargs': None}, 'num_batches': 1}})

Calculating Metrics:   0%|          | 0/6 [00:00<?, ?it/s]

  return list(domain_values[: result_format["partial_unexpected_count"]])


{
  "success": true,
  "result": {
    "element_count": 76004,
    "unexpected_count": 0,
    "unexpected_percent": 0.0,
    "partial_unexpected_list": []
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [156]:

validator.expect_column_min_to_be_between(column='pct_missing', max_value=0.0, min_value=0.0, strict_max=False, strict_min=False, meta={'profiler_details': {'metric_configuration': {'domain_kwargs': {'column': 'pct_missing'}, 'metric_dependencies': None, 'metric_name': 'column.min', 'metric_value_kwargs': None}, 'num_batches': 1}})

Calculating Metrics:   0%|          | 0/4 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "observed_value": 0.0
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [157]:

validator.expect_column_max_to_be_between(column='pct_missing', max_value=1.0, min_value=1.0, strict_max=False, strict_min=False, meta={'profiler_details': {'metric_configuration': {'domain_kwargs': {'column': 'pct_missing'}, 'metric_dependencies': None, 'metric_name': 'column.max', 'metric_value_kwargs': None}, 'num_batches': 1}})

Calculating Metrics:   0%|          | 0/4 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "observed_value": 1.0
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [158]:

validator.expect_column_values_to_be_between(column='pct_missing', max_value=1.0, min_value=0.0, mostly=1.0, strict_max=False, strict_min=False, meta={'profiler_details': {'column_max_values_range_estimator': {'metric_configuration': {'domain_kwargs': {'column': 'pct_missing'}, 'metric_dependencies': None, 'metric_name': 'column.max', 'metric_value_kwargs': None}, 'num_batches': 1}, 'column_min_values_range_estimator': {'metric_configuration': {'domain_kwargs': {'column': 'pct_missing'}, 'metric_dependencies': None, 'metric_name': 'column.min', 'metric_value_kwargs': None}, 'num_batches': 1}}})

Calculating Metrics:   0%|          | 0/8 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "element_count": 76004,
    "unexpected_count": 0,
    "unexpected_percent": 0.0,
    "partial_unexpected_list": [],
    "missing_count": 0,
    "missing_percent": 0.0,
    "unexpected_percent_total": 0.0,
    "unexpected_percent_nonmissing": 0.0
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [159]:

validator.expect_column_quantile_values_to_be_between(column='pct_missing', allow_relative_error=False, quantile_ranges={'quantiles': [0.25, 0.5, 0.75], 'value_ranges': [[0.0, 0.0], [0.0, 0.0], [0.0, 0.0]]}, meta={'profiler_details': {'metric_configuration': {'domain_kwargs': {'column': 'pct_missing'}, 'metric_dependencies': None, 'metric_name': 'column.quantile_values', 'metric_value_kwargs': {'allow_relative_error': False, 'quantiles': [0.25, 0.5, 0.75]}}, 'num_batches': 1}})

Calculating Metrics:   0%|          | 0/4 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "observed_value": {
      "quantiles": [
        0.25,
        0.5,
        0.75
      ],
      "values": [
        0.0,
        0.0,
        0.0
      ]
    },
    "details": {
      "success_details": [
        true,
        true,
        true
      ]
    }
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [160]:

validator.expect_column_median_to_be_between(column='pct_missing', max_value=0.0, min_value=0.0, strict_max=False, strict_min=False, meta={'profiler_details': {'metric_configuration': {'domain_kwargs': {'column': 'pct_missing'}, 'metric_dependencies': None, 'metric_name': 'column.median', 'metric_value_kwargs': None}, 'num_batches': 1}})

Calculating Metrics:   0%|          | 0/4 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "observed_value": 0.0
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [161]:

validator.expect_column_mean_to_be_between(column='pct_missing', max_value=0.003552192379775688, min_value=0.003552192379775688, strict_max=False, strict_min=False, meta={'profiler_details': {'metric_configuration': {'domain_kwargs': {'column': 'pct_missing'}, 'metric_dependencies': None, 'metric_name': 'column.mean', 'metric_value_kwargs': None}, 'num_batches': 1}})

  and should_run_async(code)


Calculating Metrics:   0%|          | 0/4 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "observed_value": 0.003552192379775688
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [162]:

validator.expect_column_stdev_to_be_between(column='pct_missing', max_value=0.0321447250441359, min_value=0.0321447250441359, strict_max=False, strict_min=False, meta={'profiler_details': {'metric_configuration': {'domain_kwargs': {'column': 'pct_missing'}, 'metric_dependencies': None, 'metric_name': 'column.standard_deviation', 'metric_value_kwargs': None}, 'num_batches': 1}})

Calculating Metrics:   0%|          | 0/4 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "observed_value": 0.0321447250441359
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

#### `data_min`

In [163]:

validator.expect_column_min_to_be_between(column='data_min', max_value=-31718.416015625, min_value=-31718.416015625, strict_max=False, strict_min=False, meta={'profiler_details': {'metric_configuration': {'domain_kwargs': {'column': 'data_min'}, 'metric_dependencies': None, 'metric_name': 'column.min', 'metric_value_kwargs': None}, 'num_batches': 1}})

Calculating Metrics:   0%|          | 0/4 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "observed_value": -31718.416015625
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [164]:

validator.expect_column_max_to_be_between(column='data_min', max_value=18.269269943237305, min_value=18.269269943237305, strict_max=False, strict_min=False, meta={'profiler_details': {'metric_configuration': {'domain_kwargs': {'column': 'data_min'}, 'metric_dependencies': None, 'metric_name': 'column.max', 'metric_value_kwargs': None}, 'num_batches': 1}})

Calculating Metrics:   0%|          | 0/4 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "observed_value": 18.269269943237305
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [165]:

validator.expect_column_values_to_be_between(column='data_min', max_value=18.269269943237305, min_value=-31718.416015625, mostly=1.0, strict_max=False, strict_min=False, meta={'profiler_details': {'column_max_values_range_estimator': {'metric_configuration': {'domain_kwargs': {'column': 'data_min'}, 'metric_dependencies': None, 'metric_name': 'column.max', 'metric_value_kwargs': None}, 'num_batches': 1}, 'column_min_values_range_estimator': {'metric_configuration': {'domain_kwargs': {'column': 'data_min'}, 'metric_dependencies': None, 'metric_name': 'column.min', 'metric_value_kwargs': None}, 'num_batches': 1}}})

Calculating Metrics:   0%|          | 0/8 [00:00<?, ?it/s]

  return list(domain_values[: result_format["partial_unexpected_count"]])


{
  "success": true,
  "result": {
    "element_count": 76004,
    "unexpected_count": 0,
    "unexpected_percent": 0.0,
    "partial_unexpected_list": [],
    "missing_count": 3,
    "missing_percent": 0.003947160675753908,
    "unexpected_percent_total": 0.0,
    "unexpected_percent_nonmissing": 0.0
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [166]:

validator.expect_column_quantile_values_to_be_between(column='data_min', allow_relative_error=False, quantile_ranges={'quantiles': [0.25, 0.5, 0.75], 'value_ranges': [[-54.34331130981445, -54.34331130981445], [0.0, 0.0], [0.0, 0.0]]}, meta={'profiler_details': {'metric_configuration': {'domain_kwargs': {'column': 'data_min'}, 'metric_dependencies': None, 'metric_name': 'column.quantile_values', 'metric_value_kwargs': {'allow_relative_error': False, 'quantiles': [0.25, 0.5, 0.75]}}, 'num_batches': 1}})

Calculating Metrics:   0%|          | 0/4 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "observed_value": {
      "quantiles": [
        0.25,
        0.5,
        0.75
      ],
      "values": [
        -54.34331130981445,
        0.0,
        0.0
      ]
    },
    "details": {
      "success_details": [
        true,
        true,
        true
      ]
    }
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [167]:

validator.expect_column_median_to_be_between(column='data_min', max_value=0.0, min_value=0.0, strict_max=False, strict_min=False, meta={'profiler_details': {'metric_configuration': {'domain_kwargs': {'column': 'data_min'}, 'metric_dependencies': None, 'metric_name': 'column.median', 'metric_value_kwargs': None}, 'num_batches': 1}})

Calculating Metrics:   0%|          | 0/4 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "observed_value": 0.0
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [168]:

validator.expect_column_mean_to_be_between(column='data_min', max_value=-31.575113660166586, min_value=-31.575113660166586, strict_max=False, strict_min=False, meta={'profiler_details': {'metric_configuration': {'domain_kwargs': {'column': 'data_min'}, 'metric_dependencies': None, 'metric_name': 'column.mean', 'metric_value_kwargs': None}, 'num_batches': 1}})

  and should_run_async(code)


Calculating Metrics:   0%|          | 0/4 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "observed_value": -31.575113660166586
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [169]:

validator.expect_column_stdev_to_be_between(column='data_min', max_value=474.0938475500106, min_value=474.0938475500106, strict_max=False, strict_min=False, meta={'profiler_details': {'metric_configuration': {'domain_kwargs': {'column': 'data_min'}, 'metric_dependencies': None, 'metric_name': 'column.standard_deviation', 'metric_value_kwargs': None}, 'num_batches': 1}})

Calculating Metrics:   0%|          | 0/4 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "observed_value": 474.0938475500106
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

#### `data_max`

In [170]:

validator.expect_column_min_to_be_between(column='data_max', max_value=-48.28739547729492, min_value=-48.28739547729492, strict_max=False, strict_min=False, meta={'profiler_details': {'metric_configuration': {'domain_kwargs': {'column': 'data_max'}, 'metric_dependencies': None, 'metric_name': 'column.min', 'metric_value_kwargs': None}, 'num_batches': 1}})

Calculating Metrics:   0%|          | 0/4 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "observed_value": -48.28739547729492
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [171]:

validator.expect_column_max_to_be_between(column='data_max', max_value=935036.0, min_value=935036.0, strict_max=False, strict_min=False, meta={'profiler_details': {'metric_configuration': {'domain_kwargs': {'column': 'data_max'}, 'metric_dependencies': None, 'metric_name': 'column.max', 'metric_value_kwargs': None}, 'num_batches': 1}})

Calculating Metrics:   0%|          | 0/4 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "observed_value": 935036.0
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [172]:

validator.expect_column_values_to_be_between(column='data_max', max_value=935036.0, min_value=-48.28739547729492, mostly=1.0, strict_max=False, strict_min=False, meta={'profiler_details': {'column_max_values_range_estimator': {'metric_configuration': {'domain_kwargs': {'column': 'data_max'}, 'metric_dependencies': None, 'metric_name': 'column.max', 'metric_value_kwargs': None}, 'num_batches': 1}, 'column_min_values_range_estimator': {'metric_configuration': {'domain_kwargs': {'column': 'data_max'}, 'metric_dependencies': None, 'metric_name': 'column.min', 'metric_value_kwargs': None}, 'num_batches': 1}}})

Calculating Metrics:   0%|          | 0/8 [00:00<?, ?it/s]

  return list(domain_values[: result_format["partial_unexpected_count"]])


{
  "success": true,
  "result": {
    "element_count": 76004,
    "unexpected_count": 0,
    "unexpected_percent": 0.0,
    "partial_unexpected_list": [],
    "missing_count": 3,
    "missing_percent": 0.003947160675753908,
    "unexpected_percent_total": 0.0,
    "unexpected_percent_nonmissing": 0.0
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [173]:

validator.expect_column_quantile_values_to_be_between(column='data_max', allow_relative_error=False, quantile_ranges={'quantiles': [0.25, 0.5, 0.75], 'value_ranges': [[0.1532760560512542, 0.1532760560512542], [25.870397567749023, 25.870397567749023], [254.0, 254.0]]}, meta={'profiler_details': {'metric_configuration': {'domain_kwargs': {'column': 'data_max'}, 'metric_dependencies': None, 'metric_name': 'column.quantile_values', 'metric_value_kwargs': {'allow_relative_error': False, 'quantiles': [0.25, 0.5, 0.75]}}, 'num_batches': 1}})

Calculating Metrics:   0%|          | 0/4 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "observed_value": {
      "quantiles": [
        0.25,
        0.5,
        0.75
      ],
      "values": [
        0.1532760560512542,
        25.870397567749023,
        254.0
      ]
    },
    "details": {
      "success_details": [
        true,
        true,
        true
      ]
    }
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [174]:

validator.expect_column_median_to_be_between(column='data_max', max_value=25.870397567749023, min_value=25.870397567749023, strict_max=False, strict_min=False, meta={'profiler_details': {'metric_configuration': {'domain_kwargs': {'column': 'data_max'}, 'metric_dependencies': None, 'metric_name': 'column.median', 'metric_value_kwargs': None}, 'num_batches': 1}})

Calculating Metrics:   0%|          | 0/4 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "observed_value": 25.870397567749023
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [175]:

validator.expect_column_mean_to_be_between(column='data_max', max_value=34620.575060338226, min_value=34620.575060338226, strict_max=False, strict_min=False, meta={'profiler_details': {'metric_configuration': {'domain_kwargs': {'column': 'data_max'}, 'metric_dependencies': None, 'metric_name': 'column.mean', 'metric_value_kwargs': None}, 'num_batches': 1}})

  and should_run_async(code)


Calculating Metrics:   0%|          | 0/4 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "observed_value": 34620.575060338226
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [176]:

validator.expect_column_stdev_to_be_between(column='data_max', max_value=93853.56373709308, min_value=93853.56373709308, strict_max=False, strict_min=False, meta={'profiler_details': {'metric_configuration': {'domain_kwargs': {'column': 'data_max'}, 'metric_dependencies': None, 'metric_name': 'column.standard_deviation', 'metric_value_kwargs': None}, 'num_batches': 1}})

Calculating Metrics:   0%|          | 0/4 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "observed_value": 93853.56373709308
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

#### `event_type`

In [177]:

validator.expect_column_value_lengths_to_be_between(column='event_type', max_value=17, min_value=4, mostly=1.0, strict_max=False, strict_min=False, meta={'profiler_details': {'column_max_length_range_estimator': {'metric_configuration': {'domain_kwargs': {'column': 'event_type'}, 'metric_dependencies': None, 'metric_name': 'column_values.length.max', 'metric_value_kwargs': None}, 'num_batches': 1}, 'column_min_length_range_estimator': {'metric_configuration': {'domain_kwargs': {'column': 'event_type'}, 'metric_dependencies': None, 'metric_name': 'column_values.length.min', 'metric_value_kwargs': None}, 'num_batches': 1}}})

Calculating Metrics:   0%|          | 0/9 [00:00<?, ?it/s]

  return list(domain_values[: result_format["partial_unexpected_count"]])


{
  "success": true,
  "result": {
    "element_count": 76004,
    "unexpected_count": 0,
    "unexpected_percent": 0.0,
    "partial_unexpected_list": [],
    "missing_count": 59360,
    "missing_percent": 78.10115257091732,
    "unexpected_percent_total": 0.0,
    "unexpected_percent_nonmissing": 0.0
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [178]:

validator.expect_column_values_to_match_regex(column='event_type', mostly=1.0, regex='[A-Za-z0-9\.,;:!?()\"'%\-]+', meta={'profiler_details': {'evaluated_regexes': {'(?:25[0-5]|2[0-4]\\d|[01]\\d{2}|\\d{1,2})(?:.(?:25[0-5]|2[0-4]\\d|[01]\\d{2}|\\d{1,2})){3}': 0.0, '-?\\d+': 0.0, '-?\\d+(?:\\.\\d*)?': 0.0, '<\\/?(?:p|a|b|img)(?: \\/)?>': 0.0, '[A-Za-z0-9\\.,;:!?()\\"\'%\\-]+': 1.0, '\\b[0-9a-fA-F]{8}\\b-[0-9a-fA-F]{4}-[0-5][0-9a-fA-F]{3}-[089ab][0-9a-fA-F]{3}-\\b[0-9a-fA-F]{12}\\b ': 0.0, '\\d+': 0.0, '\\s+$': 0.0, '^\\s+': 0.0, 'https?:\\/\\/(?:www\\.)?[-a-zA-Z0-9@:%._\\+~#=]{2,255}\\.[a-z]{2,6}\\b(?:[-a-zA-Z0-9@:%_\\+.~#()?&//=]*)': 0.0}, 'success_ratio': 1.0}})

  validator.expect_column_values_to_match_regex(column='event_type', mostly=1.0, regex='[A-Za-z0-9\.,;:!?()\"'%\-]+', meta={'profiler_details': {'evaluated_regexes': {'(?:25[0-5]|2[0-4]\\d|[01]\\d{2}|\\d{1,2})(?:.(?:25[0-5]|2[0-4]\\d|[01]\\d{2}|\\d{1,2})){3}': 0.0, '-?\\d+': 0.0, '-?\\d+(?:\\.\\d*)?': 0.0, '<\\/?(?:p|a|b|img)(?: \\/)?>': 0.0, '[A-Za-z0-9\\.,;:!?()\\"\'%\\-]+': 1.0, '\\b[0-9a-fA-F]{8}\\b-[0-9a-fA-F]{4}-[0-5][0-9a-fA-F]{3}-[089ab][0-9a-fA-F]{3}-\\b[0-9a-fA-F]{12}\\b ': 0.0, '\\d+': 0.0, '\\s+$': 0.0, '^\\s+': 0.0, 'https?:\\/\\/(?:www\\.)?[-a-zA-Z0-9@:%._\\+~#=]{2,255}\\.[a-z]{2,6}\\b(?:[-a-zA-Z0-9@:%_\\+.~#()?&//=]*)': 0.0}, 'success_ratio': 1.0}})


SyntaxError: unexpected character after line continuation character (<ipython-input-178-6c30f4b58ac5>, line 1)

In [179]:

validator.expect_column_values_to_be_in_set(column='event_type', mostly=1.0, value_set=['Thunderstorm Wind', 'Funnel Cloud', 'Flash Flood', 'Lightning', 'Hail', 'Tornado', 'Heavy Rain', 'Flood'], meta={'profiler_details': {'metric_configuration': {'domain_kwargs': {'column': 'event_type'}, 'metric_dependencies': None, 'metric_name': 'column.distinct_values', 'metric_value_kwargs': None}, 'num_batches': 1, 'parse_strings_as_datetimes': False}})

Calculating Metrics:   0%|          | 0/8 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "element_count": 76004,
    "unexpected_count": 0,
    "unexpected_percent": 0.0,
    "partial_unexpected_list": [],
    "missing_count": 59360,
    "missing_percent": 78.10115257091732,
    "unexpected_percent_total": 0.0,
    "unexpected_percent_nonmissing": 0.0
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [180]:

validator.expect_column_unique_value_count_to_be_between(column='event_type', max_value=8, min_value=8, strict_max=False, strict_min=False, meta={'profiler_details': {'metric_configuration': {'domain_kwargs': {'column': 'event_type'}, 'metric_dependencies': None, 'metric_name': 'column.distinct_values.count', 'metric_value_kwargs': None}, 'num_batches': 1}})

Calculating Metrics:   0%|          | 0/4 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "observed_value": 8
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

In [181]:

validator.expect_column_proportion_of_unique_values_to_be_between(column='event_type', max_value=0.0004806536890170632, min_value=0.0004806536890170632, strict_max=False, strict_min=False, meta={'profiler_details': {'metric_configuration': {'domain_kwargs': {'column': 'event_type'}, 'metric_dependencies': None, 'metric_name': 'column.unique_proportion', 'metric_value_kwargs': None}, 'num_batches': 1}})

Calculating Metrics:   0%|          | 0/7 [00:00<?, ?it/s]

{
  "success": true,
  "result": {
    "observed_value": 0.0004806536890170632
  },
  "meta": {},
  "exception_info": {
    "raised_exception": false,
    "exception_traceback": null,
    "exception_message": null
  }
}

## Review & Save Your Expectations

Let's save the expectation suite as a JSON file in the `great_expectations/expectations` directory of your project.

Let's now rebuild your Data Docs, which helps you communicate about your data with both machines and humans.

In [182]:
print(validator.get_expectation_suite(discard_failed_expectations=False))
validator.save_expectation_suite(discard_failed_expectations=False)

checkpoint_config = {
    "class_name": "SimpleCheckpoint",
    "validations": [
        {
            "batch_request": batch_request,
            "expectation_suite_name": expectation_suite_name
        }
    ]
}
checkpoint = SimpleCheckpoint(
    f"{validator.active_batch_definition.data_asset_name}_{expectation_suite_name}",
    context,
    **checkpoint_config
)
checkpoint_result = checkpoint.run()

context.build_data_docs()

validation_result_identifier = checkpoint_result.list_validation_result_identifiers()[0]
context.open_data_docs(resource_identifier=validation_result_identifier)

2022-11-09T23:05:11-0500 - INFO - 	85 expectation(s) included in expectation_suite.
{
  "meta": {
    "citations": [
      {
        "citation_date": "2022-10-31T06:35:42.022783Z",
        "comment": "Created by effective Rule-Based Profiler of OnboardingDataAssistant with the configuration included.\n"
      },
      {
        "batch_request": {
          "data_asset_name": "CATALOG.csv",
          "data_connector_name": "default_inferred_data_connector_name",
          "datasource_name": "SEVIR_CATALOG_1",
          "limit": 1000
        },
        "citation_date": "2022-11-09T22:17:05.547067Z",
        "comment": "Created suite added via CLI"
      }
    ],
    "great_expectations_version": "0.15.29"
  },
  "expectations": [
    {
      "kwargs": {
        "max_value": 76004,
        "min_value": 76004
      },
      "meta": {},
      "expectation_type": "expect_table_row_count_to_be_between"
    },
    {
      "kwargs": {
        "column_set": [
          "event_id",
          "epi

2022-11-09T23:05:12-0500 - INFO - 	85 expectation(s) included in expectation_suite.


  df = reader_fn(path, **reader_options)


Calculating Metrics:   0%|          | 0/159 [00:00<?, ?it/s]

  return list(domain_values[: result_format["partial_unexpected_count"]])
