# Libraries

In [1]:
import os
import time

import tfx
import tensorflow as tf
import tensorflow_data_validation as tfdv
import tensorflow_model_analysis as tfma
import tensorflow_transform as tft

from tensorflow_metadata.proto.v0 import schema_pb2

from tfx.orchestration.experimental.interactive.interactive_context import InteractiveContext
from tfx.proto import example_gen_pb2
from tfx.components import CsvExampleGen
from tfx.components import SchemaGen
from tfx.components.common_nodes.importer_node import ImporterNode
from tfx.components import ExampleValidator
from tfx.components import Transform

# Running Data Cleaning File

In [2]:
!python clean_data.py

A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['Wages'] = df['Wages'].str.replace(',', '')
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['Wages'] = df['Wages'].str.replace('€ ', '')
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['Wages'] = df['Wages'].str.replace(' pw', '')
A value is trying to be set on a copy of a slice from a DataF

# Artifact, Serving Model, Data Locations

In [3]:
ARTIFACT_STORE = os.path.join(os.sep, 'Users', 'CarlosMonsivais', 'Desktop', 'TFX_football_manager_2022', 'Artifacts')
SERVING_MODEL_DIR = os.path.join(os.sep, 'Users', 'CarlosMonsivais', 'Desktop', 'TFX_football_manager_2022', 'Model')
DATA_ROOT = '/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Clean_Data'

print('Artifact Storage: {}'.format(ARTIFACT_STORE))
print('Serving Model Storage: {}'.format(SERVING_MODEL_DIR))
print('Data Root: {}'.format(DATA_ROOT))

Artifact Storage: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts
Serving Model Storage: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Model
Data Root: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Clean_Data


# Pipeline Names

In [4]:
PIPELINE_NAME = 'tfx-football-pipeline'
PIPELINE_ROOT = os.path.join(ARTIFACT_STORE, PIPELINE_NAME, time.strftime("%Y%m%d_%H%M%S"))

# Creating a directory in the Artifact Storage variable where the pipline metadata will be stored using this timestamp.
os.makedirs(PIPELINE_ROOT, exist_ok = True)

print('Created a directory here:{} \nwhere the pipleine metadata artifacts will be stored.'.format(PIPELINE_ROOT))

Created a directory here:/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422 
where the pipleine metadata artifacts will be stored.


# Only for Jupyter Notebook Interactivity

In [5]:
context = InteractiveContext(pipeline_name = PIPELINE_NAME,
                             pipeline_root = PIPELINE_ROOT,
                             metadata_connection_config = None)



# Reading in Data

In [6]:
input_config = example_gen_pb2.Input(splits=[example_gen_pb2.Input.Split(name = 'clean_football_manager_22', 
                                                                         pattern = '*.csv')])

In [7]:
# Doing an 80:20 Train Eval Split
output_config = example_gen_pb2.Output(split_config = example_gen_pb2.SplitConfig(splits=[example_gen_pb2.SplitConfig.Split(name = 'train_data', hash_buckets = 4),
                                                                                          example_gen_pb2.SplitConfig.Split(name = 'test_data', hash_buckets = 1)]))

In [8]:
example_gen = tfx.components.CsvExampleGen(input_base = DATA_ROOT,
                                           input_config = input_config,
                                           output_config = output_config)

In [9]:
context.run(example_gen)





0,1
.execution_id,1
.component,"function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } CsvExampleGen at 0x7fd57c152370.inputs{}.outputs['examples'] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Channel of type 'Examples' (1 artifact) at 0x7fd57c152fd0.type_nameExamples._artifacts[0] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'Examples' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/CsvExampleGen/examples/1) at 0x7fd57c178100.type<class 'tfx.types.standard_artifacts.Examples'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/CsvExampleGen/examples/1.span0.split_names[""train_data"", ""test_data""].version0.exec_properties['input_base']/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Clean_Data['input_config']{  ""splits"": [  {  ""name"": ""clean_football_manager_22"",  ""pattern"": ""*.csv""  }  ] }['output_config']{  ""split_config"": {  ""splits"": [  {  ""hash_buckets"": 4,  ""name"": ""train_data""  },  {  ""hash_buckets"": 1,  ""name"": ""test_data""  }  ]  } }['output_data_format']6['custom_config']None['range_config']None['span']0['version']None['input_fingerprint']split:clean_football_manager_22,num_files:1,total_bytes:46907884,xor_checksum:1642981346,sum_checksum:1642981346"
.component.inputs,{}
.component.outputs,"['examples'] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Channel of type 'Examples' (1 artifact) at 0x7fd57c152fd0.type_nameExamples._artifacts[0] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'Examples' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/CsvExampleGen/examples/1) at 0x7fd57c178100.type<class 'tfx.types.standard_artifacts.Examples'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/CsvExampleGen/examples/1.span0.split_names[""train_data"", ""test_data""].version0"

0,1
.inputs,{}
.outputs,"['examples'] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Channel of type 'Examples' (1 artifact) at 0x7fd57c152fd0.type_nameExamples._artifacts[0] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'Examples' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/CsvExampleGen/examples/1) at 0x7fd57c178100.type<class 'tfx.types.standard_artifacts.Examples'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/CsvExampleGen/examples/1.span0.split_names[""train_data"", ""test_data""].version0"
.exec_properties,"['input_base']/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Clean_Data['input_config']{  ""splits"": [  {  ""name"": ""clean_football_manager_22"",  ""pattern"": ""*.csv""  }  ] }['output_config']{  ""split_config"": {  ""splits"": [  {  ""hash_buckets"": 4,  ""name"": ""train_data""  },  {  ""hash_buckets"": 1,  ""name"": ""test_data""  }  ]  } }['output_data_format']6['custom_config']None['range_config']None['span']0['version']None['input_fingerprint']split:clean_football_manager_22,num_files:1,total_bytes:46907884,xor_checksum:1642981346,sum_checksum:1642981346"

0,1
['examples'],"function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Channel of type 'Examples' (1 artifact) at 0x7fd57c152fd0.type_nameExamples._artifacts[0] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'Examples' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/CsvExampleGen/examples/1) at 0x7fd57c178100.type<class 'tfx.types.standard_artifacts.Examples'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/CsvExampleGen/examples/1.span0.split_names[""train_data"", ""test_data""].version0"

0,1
.type_name,Examples
._artifacts,"[0] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'Examples' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/CsvExampleGen/examples/1) at 0x7fd57c178100.type<class 'tfx.types.standard_artifacts.Examples'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/CsvExampleGen/examples/1.span0.split_names[""train_data"", ""test_data""].version0"

0,1
[0],"function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'Examples' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/CsvExampleGen/examples/1) at 0x7fd57c178100.type<class 'tfx.types.standard_artifacts.Examples'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/CsvExampleGen/examples/1.span0.split_names[""train_data"", ""test_data""].version0"

0,1
.type,<class 'tfx.types.standard_artifacts.Examples'>
.uri,/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/CsvExampleGen/examples/1
.span,0
.split_names,"[""train_data"", ""test_data""]"
.version,0

0,1
['input_base'],/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Clean_Data
['input_config'],"{  ""splits"": [  {  ""name"": ""clean_football_manager_22"",  ""pattern"": ""*.csv""  }  ] }"
['output_config'],"{  ""split_config"": {  ""splits"": [  {  ""hash_buckets"": 4,  ""name"": ""train_data""  },  {  ""hash_buckets"": 1,  ""name"": ""test_data""  }  ]  } }"
['output_data_format'],6
['custom_config'],
['range_config'],
['span'],0
['version'],
['input_fingerprint'],"split:clean_football_manager_22,num_files:1,total_bytes:46907884,xor_checksum:1642981346,sum_checksum:1642981346"

0,1
['examples'],"function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Channel of type 'Examples' (1 artifact) at 0x7fd57c152fd0.type_nameExamples._artifacts[0] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'Examples' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/CsvExampleGen/examples/1) at 0x7fd57c178100.type<class 'tfx.types.standard_artifacts.Examples'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/CsvExampleGen/examples/1.span0.split_names[""train_data"", ""test_data""].version0"

0,1
.type_name,Examples
._artifacts,"[0] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'Examples' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/CsvExampleGen/examples/1) at 0x7fd57c178100.type<class 'tfx.types.standard_artifacts.Examples'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/CsvExampleGen/examples/1.span0.split_names[""train_data"", ""test_data""].version0"

0,1
[0],"function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'Examples' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/CsvExampleGen/examples/1) at 0x7fd57c178100.type<class 'tfx.types.standard_artifacts.Examples'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/CsvExampleGen/examples/1.span0.split_names[""train_data"", ""test_data""].version0"

0,1
.type,<class 'tfx.types.standard_artifacts.Examples'>
.uri,/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/CsvExampleGen/examples/1
.span,0
.split_names,"[""train_data"", ""test_data""]"
.version,0


In [10]:
# Shows features
examples_uri = example_gen.outputs['examples'].get()[0].uri
tfrecord_filenames = [os.path.join(examples_uri, 'train_data', name)
                      for name in os.listdir(os.path.join(examples_uri, 'train_data'))]
dataset = tf.data.TFRecordDataset(tfrecord_filenames, compression_type="GZIP")
for tfrecord in dataset.take(2):
  example = tf.train.Example()
  example.ParseFromString(tfrecord.numpy())
  for name, feature in example.features.feature.items():
    if feature.HasField('bytes_list'):
        value = feature.bytes_list.value
    if feature.HasField('float_list'):
        value = feature.float_list.value
    if feature.HasField('int64_list'):
        value = feature.int64_list.value
    print('{}: {}'.format(name, value))
  print('******')

Concentration: [10]
Balance: [17]
Anticipation: [15]
Long Throws: [3.0]
First Touch: [16]
Corners: [3.0]
Communication: []
Heading: [17.0]
Crossing: [6.0]
Stamina: [18]
Free Kick Taking: [15]
Caps: [22.0]
Dribbling: [14.0]
Agility: [13]
Penalty Taking: [13]
Flair: [18]
Tackling: [13.0]
Composure: [10]
Kicking: []
Bravery: [17]
Command of Area: []
Technique: [16]
Natural Fitness: [20]
Off the Ball: [16]
Long Shots: [15.0]
Sell value: [73441416.0]
Throwing: []
Wages: [113890.0]
Contract end: [b'2024-06-30']
Determination: [17]
Weight: [82]
One on Ones: []
Reflexes: []
Punching (Tendency): []
Positioning: [11]
Marking: [9.0]
Eccentricity: []
Rushing Out (Tendency): []
Passing: [16]
Potential: [85.0]
Decisions: [13]
Name: [b'Sergej Milinkovic-Savic']
Vision: [15]
Foot: [b'Right']
Ability: [82.0]
Position: [b'MC']
Handling: []
Acceleration: [13]
Goals: [3.0]
Club: [b'Lazio']
Aggression: [14]
Length: [191]
Finishing: [15.0]
Pace: [12]
Nation: [b'Serbia']
Unique ID: [62127037]
Strength: [17]


# StaisticsGen Component

In [11]:
statistics_gen = tfx.components.StatisticsGen(examples = example_gen.outputs['examples'])

In [12]:
context.run(statistics_gen)



0,1
.execution_id,2
.component,"function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } StatisticsGen at 0x7fd56e4ba5e0.inputs['examples'] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Channel of type 'Examples' (1 artifact) at 0x7fd57c152fd0.type_nameExamples._artifacts[0] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'Examples' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/CsvExampleGen/examples/1) at 0x7fd57c178100.type<class 'tfx.types.standard_artifacts.Examples'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/CsvExampleGen/examples/1.span0.split_names[""train_data"", ""test_data""].version0.outputs['statistics'] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Channel of type 'ExampleStatistics' (1 artifact) at 0x7fd56e4ba220.type_nameExampleStatistics._artifacts[0] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'ExampleStatistics' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/StatisticsGen/statistics/2) at 0x7fd57cc63610.type<class 'tfx.types.standard_artifacts.ExampleStatistics'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/StatisticsGen/statistics/2.span0.split_names[""train_data"", ""test_data""].exec_properties['stats_options_json']None['exclude_splits'][]"
.component.inputs,"['examples'] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Channel of type 'Examples' (1 artifact) at 0x7fd57c152fd0.type_nameExamples._artifacts[0] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'Examples' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/CsvExampleGen/examples/1) at 0x7fd57c178100.type<class 'tfx.types.standard_artifacts.Examples'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/CsvExampleGen/examples/1.span0.split_names[""train_data"", ""test_data""].version0"
.component.outputs,"['statistics'] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Channel of type 'ExampleStatistics' (1 artifact) at 0x7fd56e4ba220.type_nameExampleStatistics._artifacts[0] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'ExampleStatistics' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/StatisticsGen/statistics/2) at 0x7fd57cc63610.type<class 'tfx.types.standard_artifacts.ExampleStatistics'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/StatisticsGen/statistics/2.span0.split_names[""train_data"", ""test_data""]"

0,1
.inputs,"['examples'] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Channel of type 'Examples' (1 artifact) at 0x7fd57c152fd0.type_nameExamples._artifacts[0] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'Examples' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/CsvExampleGen/examples/1) at 0x7fd57c178100.type<class 'tfx.types.standard_artifacts.Examples'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/CsvExampleGen/examples/1.span0.split_names[""train_data"", ""test_data""].version0"
.outputs,"['statistics'] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Channel of type 'ExampleStatistics' (1 artifact) at 0x7fd56e4ba220.type_nameExampleStatistics._artifacts[0] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'ExampleStatistics' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/StatisticsGen/statistics/2) at 0x7fd57cc63610.type<class 'tfx.types.standard_artifacts.ExampleStatistics'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/StatisticsGen/statistics/2.span0.split_names[""train_data"", ""test_data""]"
.exec_properties,['stats_options_json']None['exclude_splits'][]

0,1
['examples'],"function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Channel of type 'Examples' (1 artifact) at 0x7fd57c152fd0.type_nameExamples._artifacts[0] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'Examples' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/CsvExampleGen/examples/1) at 0x7fd57c178100.type<class 'tfx.types.standard_artifacts.Examples'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/CsvExampleGen/examples/1.span0.split_names[""train_data"", ""test_data""].version0"

0,1
.type_name,Examples
._artifacts,"[0] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'Examples' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/CsvExampleGen/examples/1) at 0x7fd57c178100.type<class 'tfx.types.standard_artifacts.Examples'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/CsvExampleGen/examples/1.span0.split_names[""train_data"", ""test_data""].version0"

0,1
[0],"function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'Examples' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/CsvExampleGen/examples/1) at 0x7fd57c178100.type<class 'tfx.types.standard_artifacts.Examples'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/CsvExampleGen/examples/1.span0.split_names[""train_data"", ""test_data""].version0"

0,1
.type,<class 'tfx.types.standard_artifacts.Examples'>
.uri,/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/CsvExampleGen/examples/1
.span,0
.split_names,"[""train_data"", ""test_data""]"
.version,0

0,1
['statistics'],"function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Channel of type 'ExampleStatistics' (1 artifact) at 0x7fd56e4ba220.type_nameExampleStatistics._artifacts[0] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'ExampleStatistics' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/StatisticsGen/statistics/2) at 0x7fd57cc63610.type<class 'tfx.types.standard_artifacts.ExampleStatistics'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/StatisticsGen/statistics/2.span0.split_names[""train_data"", ""test_data""]"

0,1
.type_name,ExampleStatistics
._artifacts,"[0] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'ExampleStatistics' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/StatisticsGen/statistics/2) at 0x7fd57cc63610.type<class 'tfx.types.standard_artifacts.ExampleStatistics'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/StatisticsGen/statistics/2.span0.split_names[""train_data"", ""test_data""]"

0,1
[0],"function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'ExampleStatistics' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/StatisticsGen/statistics/2) at 0x7fd57cc63610.type<class 'tfx.types.standard_artifacts.ExampleStatistics'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/StatisticsGen/statistics/2.span0.split_names[""train_data"", ""test_data""]"

0,1
.type,<class 'tfx.types.standard_artifacts.ExampleStatistics'>
.uri,/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/StatisticsGen/statistics/2
.span,0
.split_names,"[""train_data"", ""test_data""]"

0,1
['stats_options_json'],
['exclude_splits'],[]

0,1
['examples'],"function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Channel of type 'Examples' (1 artifact) at 0x7fd57c152fd0.type_nameExamples._artifacts[0] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'Examples' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/CsvExampleGen/examples/1) at 0x7fd57c178100.type<class 'tfx.types.standard_artifacts.Examples'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/CsvExampleGen/examples/1.span0.split_names[""train_data"", ""test_data""].version0"

0,1
.type_name,Examples
._artifacts,"[0] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'Examples' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/CsvExampleGen/examples/1) at 0x7fd57c178100.type<class 'tfx.types.standard_artifacts.Examples'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/CsvExampleGen/examples/1.span0.split_names[""train_data"", ""test_data""].version0"

0,1
[0],"function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'Examples' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/CsvExampleGen/examples/1) at 0x7fd57c178100.type<class 'tfx.types.standard_artifacts.Examples'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/CsvExampleGen/examples/1.span0.split_names[""train_data"", ""test_data""].version0"

0,1
.type,<class 'tfx.types.standard_artifacts.Examples'>
.uri,/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/CsvExampleGen/examples/1
.span,0
.split_names,"[""train_data"", ""test_data""]"
.version,0

0,1
['statistics'],"function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Channel of type 'ExampleStatistics' (1 artifact) at 0x7fd56e4ba220.type_nameExampleStatistics._artifacts[0] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'ExampleStatistics' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/StatisticsGen/statistics/2) at 0x7fd57cc63610.type<class 'tfx.types.standard_artifacts.ExampleStatistics'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/StatisticsGen/statistics/2.span0.split_names[""train_data"", ""test_data""]"

0,1
.type_name,ExampleStatistics
._artifacts,"[0] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'ExampleStatistics' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/StatisticsGen/statistics/2) at 0x7fd57cc63610.type<class 'tfx.types.standard_artifacts.ExampleStatistics'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/StatisticsGen/statistics/2.span0.split_names[""train_data"", ""test_data""]"

0,1
[0],"function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'ExampleStatistics' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/StatisticsGen/statistics/2) at 0x7fd57cc63610.type<class 'tfx.types.standard_artifacts.ExampleStatistics'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/StatisticsGen/statistics/2.span0.split_names[""train_data"", ""test_data""]"

0,1
.type,<class 'tfx.types.standard_artifacts.ExampleStatistics'>
.uri,/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/StatisticsGen/statistics/2
.span,0
.split_names,"[""train_data"", ""test_data""]"


In [13]:
context.show(statistics_gen.outputs['statistics'])

Instructions for updating:
Use eager execution and: 
`tf.data.TFRecordDataset(path)`


Instructions for updating:
Use eager execution and: 
`tf.data.TFRecordDataset(path)`


# SchemaGen

In [14]:
schema_gen = SchemaGen(statistics=statistics_gen.outputs['statistics'],
                       infer_feature_shape=False)

In [15]:
context.run(schema_gen)

0,1
.execution_id,3
.component,"function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } SchemaGen at 0x7fd50cccabb0.inputs['statistics'] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Channel of type 'ExampleStatistics' (1 artifact) at 0x7fd56e4ba220.type_nameExampleStatistics._artifacts[0] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'ExampleStatistics' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/StatisticsGen/statistics/2) at 0x7fd57cc63610.type<class 'tfx.types.standard_artifacts.ExampleStatistics'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/StatisticsGen/statistics/2.span0.split_names[""train_data"", ""test_data""].outputs['schema'] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Channel of type 'Schema' (1 artifact) at 0x7fd50ccca820.type_nameSchema._artifacts[0] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'Schema' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/SchemaGen/schema/3) at 0x7fd56e487370.type<class 'tfx.types.standard_artifacts.Schema'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/SchemaGen/schema/3.exec_properties['infer_feature_shape']0['exclude_splits'][]"
.component.inputs,"['statistics'] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Channel of type 'ExampleStatistics' (1 artifact) at 0x7fd56e4ba220.type_nameExampleStatistics._artifacts[0] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'ExampleStatistics' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/StatisticsGen/statistics/2) at 0x7fd57cc63610.type<class 'tfx.types.standard_artifacts.ExampleStatistics'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/StatisticsGen/statistics/2.span0.split_names[""train_data"", ""test_data""]"
.component.outputs,['schema'] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Channel of type 'Schema' (1 artifact) at 0x7fd50ccca820.type_nameSchema._artifacts[0] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'Schema' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/SchemaGen/schema/3) at 0x7fd56e487370.type<class 'tfx.types.standard_artifacts.Schema'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/SchemaGen/schema/3

0,1
.inputs,"['statistics'] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Channel of type 'ExampleStatistics' (1 artifact) at 0x7fd56e4ba220.type_nameExampleStatistics._artifacts[0] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'ExampleStatistics' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/StatisticsGen/statistics/2) at 0x7fd57cc63610.type<class 'tfx.types.standard_artifacts.ExampleStatistics'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/StatisticsGen/statistics/2.span0.split_names[""train_data"", ""test_data""]"
.outputs,['schema'] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Channel of type 'Schema' (1 artifact) at 0x7fd50ccca820.type_nameSchema._artifacts[0] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'Schema' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/SchemaGen/schema/3) at 0x7fd56e487370.type<class 'tfx.types.standard_artifacts.Schema'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/SchemaGen/schema/3
.exec_properties,['infer_feature_shape']0['exclude_splits'][]

0,1
['statistics'],"function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Channel of type 'ExampleStatistics' (1 artifact) at 0x7fd56e4ba220.type_nameExampleStatistics._artifacts[0] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'ExampleStatistics' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/StatisticsGen/statistics/2) at 0x7fd57cc63610.type<class 'tfx.types.standard_artifacts.ExampleStatistics'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/StatisticsGen/statistics/2.span0.split_names[""train_data"", ""test_data""]"

0,1
.type_name,ExampleStatistics
._artifacts,"[0] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'ExampleStatistics' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/StatisticsGen/statistics/2) at 0x7fd57cc63610.type<class 'tfx.types.standard_artifacts.ExampleStatistics'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/StatisticsGen/statistics/2.span0.split_names[""train_data"", ""test_data""]"

0,1
[0],"function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'ExampleStatistics' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/StatisticsGen/statistics/2) at 0x7fd57cc63610.type<class 'tfx.types.standard_artifacts.ExampleStatistics'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/StatisticsGen/statistics/2.span0.split_names[""train_data"", ""test_data""]"

0,1
.type,<class 'tfx.types.standard_artifacts.ExampleStatistics'>
.uri,/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/StatisticsGen/statistics/2
.span,0
.split_names,"[""train_data"", ""test_data""]"

0,1
['schema'],function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Channel of type 'Schema' (1 artifact) at 0x7fd50ccca820.type_nameSchema._artifacts[0] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'Schema' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/SchemaGen/schema/3) at 0x7fd56e487370.type<class 'tfx.types.standard_artifacts.Schema'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/SchemaGen/schema/3

0,1
.type_name,Schema
._artifacts,[0] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'Schema' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/SchemaGen/schema/3) at 0x7fd56e487370.type<class 'tfx.types.standard_artifacts.Schema'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/SchemaGen/schema/3

0,1
[0],function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'Schema' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/SchemaGen/schema/3) at 0x7fd56e487370.type<class 'tfx.types.standard_artifacts.Schema'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/SchemaGen/schema/3

0,1
.type,<class 'tfx.types.standard_artifacts.Schema'>
.uri,/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/SchemaGen/schema/3

0,1
['infer_feature_shape'],0
['exclude_splits'],[]

0,1
['statistics'],"function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Channel of type 'ExampleStatistics' (1 artifact) at 0x7fd56e4ba220.type_nameExampleStatistics._artifacts[0] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'ExampleStatistics' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/StatisticsGen/statistics/2) at 0x7fd57cc63610.type<class 'tfx.types.standard_artifacts.ExampleStatistics'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/StatisticsGen/statistics/2.span0.split_names[""train_data"", ""test_data""]"

0,1
.type_name,ExampleStatistics
._artifacts,"[0] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'ExampleStatistics' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/StatisticsGen/statistics/2) at 0x7fd57cc63610.type<class 'tfx.types.standard_artifacts.ExampleStatistics'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/StatisticsGen/statistics/2.span0.split_names[""train_data"", ""test_data""]"

0,1
[0],"function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'ExampleStatistics' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/StatisticsGen/statistics/2) at 0x7fd57cc63610.type<class 'tfx.types.standard_artifacts.ExampleStatistics'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/StatisticsGen/statistics/2.span0.split_names[""train_data"", ""test_data""]"

0,1
.type,<class 'tfx.types.standard_artifacts.ExampleStatistics'>
.uri,/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/StatisticsGen/statistics/2
.span,0
.split_names,"[""train_data"", ""test_data""]"

0,1
['schema'],function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Channel of type 'Schema' (1 artifact) at 0x7fd50ccca820.type_nameSchema._artifacts[0] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'Schema' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/SchemaGen/schema/3) at 0x7fd56e487370.type<class 'tfx.types.standard_artifacts.Schema'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/SchemaGen/schema/3

0,1
.type_name,Schema
._artifacts,[0] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'Schema' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/SchemaGen/schema/3) at 0x7fd56e487370.type<class 'tfx.types.standard_artifacts.Schema'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/SchemaGen/schema/3

0,1
[0],function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'Schema' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/SchemaGen/schema/3) at 0x7fd56e487370.type<class 'tfx.types.standard_artifacts.Schema'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/SchemaGen/schema/3

0,1
.type,<class 'tfx.types.standard_artifacts.Schema'>
.uri,/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/SchemaGen/schema/3


In [16]:
context.show(schema_gen.outputs['schema'])

Unnamed: 0_level_0,Type,Presence,Valency,Domain
Feature name,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1
'Ability',FLOAT,required,single,-
'Acceleration',INT,required,single,-
'Aerial Reach',FLOAT,required,,-
'Age',INT,required,single,-
'Aggression',INT,required,single,-
...,...,...,...,...
'Unique ID',INT,required,single,-
'Vision',INT,required,single,-
'Wages',FLOAT,required,,-
'Weight',INT,required,single,-


  pd.set_option('max_colwidth', -1)


Unnamed: 0_level_0,Values
Domain,Unnamed: 1_level_1
'Foot',"'Both', 'Left', 'Right'"


## Updating SchemaGen File (In case you want to make any changes to the file.)

In [None]:
# You can chage this file to customize it as you want it for your schema.
schema_proto_path = '{}/{}'.format(schema_gen.outputs['schema'].get()[0].uri, 'schema.pbtxt')
schema = tfdv.load_schema_text(schema_proto_path)

In [None]:
# tfdv.set_domain(schema, 'Cover_Type', schema_pb2.IntDomain(name='Cover_Type', min=0, max=6, is_categorical=True))   (for categorical variable)
tfdv.set_domain(schema, 'Ability',  schema_pb2.IntDomain(name='Ability', min=0, max=20, ))

In [None]:
schema_dir = os.path.join(ARTIFACT_STORE, 'schema')
tf.io.gfile.makedirs(schema_dir)
schema_file = os.path.join(schema_dir, 'schema.pbtxt')

tfdv.write_schema_text(schema, schema_file)

!cat {schema_file}

In [None]:
schema_importer = ImporterNode(instance_name = 'Schema_Importer',
                               source_uri = schema_dir,
                               artifact_type=tfx.types.standard_artifacts.Schema,
                               reimport=False)

In [None]:
context.run(schema_importer)

In [None]:
context.show(schema_importer.outputs['result'])

# Example Validator (Anomaly Detection)

In [17]:
# Only use if the schema_importer is one that you edited 

# example_validator = ExampleValidator(instance_name = "Data_Validation",
#                                      statistics = statistics_gen.outputs['statistics'],
#                                      schema = schema_importer.outputs['result'])


example_validator = ExampleValidator(instance_name = "Data_Validation",
                                     statistics = statistics_gen.outputs['statistics'],
                                     schema = schema_gen.outputs['schema'])



In [18]:
context.run(example_validator)

0,1
.execution_id,4
.component,"function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } ExampleValidator at 0x7fd50cd963a0.inputs['statistics'] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Channel of type 'ExampleStatistics' (1 artifact) at 0x7fd56e4ba220.type_nameExampleStatistics._artifacts[0] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'ExampleStatistics' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/StatisticsGen/statistics/2) at 0x7fd57cc63610.type<class 'tfx.types.standard_artifacts.ExampleStatistics'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/StatisticsGen/statistics/2.span0.split_names[""train_data"", ""test_data""]['schema'] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Channel of type 'Schema' (1 artifact) at 0x7fd50ccca820.type_nameSchema._artifacts[0] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'Schema' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/SchemaGen/schema/3) at 0x7fd56e487370.type<class 'tfx.types.standard_artifacts.Schema'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/SchemaGen/schema/3.outputs['anomalies'] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Channel of type 'ExampleAnomalies' (1 artifact) at 0x7fd50cd966a0.type_nameExampleAnomalies._artifacts[0] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'ExampleAnomalies' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/ExampleValidator.Data_Validation/anomalies/4) at 0x7fd50cd96670.type<class 'tfx.types.standard_artifacts.ExampleAnomalies'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/ExampleValidator.Data_Validation/anomalies/4.span0.split_names[""train_data"", ""test_data""].exec_properties['exclude_splits'][]"
.component.inputs,"['statistics'] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Channel of type 'ExampleStatistics' (1 artifact) at 0x7fd56e4ba220.type_nameExampleStatistics._artifacts[0] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'ExampleStatistics' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/StatisticsGen/statistics/2) at 0x7fd57cc63610.type<class 'tfx.types.standard_artifacts.ExampleStatistics'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/StatisticsGen/statistics/2.span0.split_names[""train_data"", ""test_data""]['schema'] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Channel of type 'Schema' (1 artifact) at 0x7fd50ccca820.type_nameSchema._artifacts[0] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'Schema' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/SchemaGen/schema/3) at 0x7fd56e487370.type<class 'tfx.types.standard_artifacts.Schema'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/SchemaGen/schema/3"
.component.outputs,"['anomalies'] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Channel of type 'ExampleAnomalies' (1 artifact) at 0x7fd50cd966a0.type_nameExampleAnomalies._artifacts[0] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'ExampleAnomalies' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/ExampleValidator.Data_Validation/anomalies/4) at 0x7fd50cd96670.type<class 'tfx.types.standard_artifacts.ExampleAnomalies'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/ExampleValidator.Data_Validation/anomalies/4.span0.split_names[""train_data"", ""test_data""]"

0,1
.inputs,"['statistics'] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Channel of type 'ExampleStatistics' (1 artifact) at 0x7fd56e4ba220.type_nameExampleStatistics._artifacts[0] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'ExampleStatistics' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/StatisticsGen/statistics/2) at 0x7fd57cc63610.type<class 'tfx.types.standard_artifacts.ExampleStatistics'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/StatisticsGen/statistics/2.span0.split_names[""train_data"", ""test_data""]['schema'] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Channel of type 'Schema' (1 artifact) at 0x7fd50ccca820.type_nameSchema._artifacts[0] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'Schema' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/SchemaGen/schema/3) at 0x7fd56e487370.type<class 'tfx.types.standard_artifacts.Schema'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/SchemaGen/schema/3"
.outputs,"['anomalies'] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Channel of type 'ExampleAnomalies' (1 artifact) at 0x7fd50cd966a0.type_nameExampleAnomalies._artifacts[0] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'ExampleAnomalies' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/ExampleValidator.Data_Validation/anomalies/4) at 0x7fd50cd96670.type<class 'tfx.types.standard_artifacts.ExampleAnomalies'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/ExampleValidator.Data_Validation/anomalies/4.span0.split_names[""train_data"", ""test_data""]"
.exec_properties,['exclude_splits'][]

0,1
['statistics'],"function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Channel of type 'ExampleStatistics' (1 artifact) at 0x7fd56e4ba220.type_nameExampleStatistics._artifacts[0] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'ExampleStatistics' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/StatisticsGen/statistics/2) at 0x7fd57cc63610.type<class 'tfx.types.standard_artifacts.ExampleStatistics'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/StatisticsGen/statistics/2.span0.split_names[""train_data"", ""test_data""]"
['schema'],function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Channel of type 'Schema' (1 artifact) at 0x7fd50ccca820.type_nameSchema._artifacts[0] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'Schema' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/SchemaGen/schema/3) at 0x7fd56e487370.type<class 'tfx.types.standard_artifacts.Schema'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/SchemaGen/schema/3

0,1
.type_name,ExampleStatistics
._artifacts,"[0] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'ExampleStatistics' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/StatisticsGen/statistics/2) at 0x7fd57cc63610.type<class 'tfx.types.standard_artifacts.ExampleStatistics'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/StatisticsGen/statistics/2.span0.split_names[""train_data"", ""test_data""]"

0,1
[0],"function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'ExampleStatistics' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/StatisticsGen/statistics/2) at 0x7fd57cc63610.type<class 'tfx.types.standard_artifacts.ExampleStatistics'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/StatisticsGen/statistics/2.span0.split_names[""train_data"", ""test_data""]"

0,1
.type,<class 'tfx.types.standard_artifacts.ExampleStatistics'>
.uri,/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/StatisticsGen/statistics/2
.span,0
.split_names,"[""train_data"", ""test_data""]"

0,1
.type_name,Schema
._artifacts,[0] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'Schema' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/SchemaGen/schema/3) at 0x7fd56e487370.type<class 'tfx.types.standard_artifacts.Schema'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/SchemaGen/schema/3

0,1
[0],function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'Schema' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/SchemaGen/schema/3) at 0x7fd56e487370.type<class 'tfx.types.standard_artifacts.Schema'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/SchemaGen/schema/3

0,1
.type,<class 'tfx.types.standard_artifacts.Schema'>
.uri,/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/SchemaGen/schema/3

0,1
['anomalies'],"function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Channel of type 'ExampleAnomalies' (1 artifact) at 0x7fd50cd966a0.type_nameExampleAnomalies._artifacts[0] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'ExampleAnomalies' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/ExampleValidator.Data_Validation/anomalies/4) at 0x7fd50cd96670.type<class 'tfx.types.standard_artifacts.ExampleAnomalies'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/ExampleValidator.Data_Validation/anomalies/4.span0.split_names[""train_data"", ""test_data""]"

0,1
.type_name,ExampleAnomalies
._artifacts,"[0] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'ExampleAnomalies' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/ExampleValidator.Data_Validation/anomalies/4) at 0x7fd50cd96670.type<class 'tfx.types.standard_artifacts.ExampleAnomalies'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/ExampleValidator.Data_Validation/anomalies/4.span0.split_names[""train_data"", ""test_data""]"

0,1
[0],"function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'ExampleAnomalies' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/ExampleValidator.Data_Validation/anomalies/4) at 0x7fd50cd96670.type<class 'tfx.types.standard_artifacts.ExampleAnomalies'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/ExampleValidator.Data_Validation/anomalies/4.span0.split_names[""train_data"", ""test_data""]"

0,1
.type,<class 'tfx.types.standard_artifacts.ExampleAnomalies'>
.uri,/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/ExampleValidator.Data_Validation/anomalies/4
.span,0
.split_names,"[""train_data"", ""test_data""]"

0,1
['exclude_splits'],[]

0,1
['statistics'],"function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Channel of type 'ExampleStatistics' (1 artifact) at 0x7fd56e4ba220.type_nameExampleStatistics._artifacts[0] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'ExampleStatistics' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/StatisticsGen/statistics/2) at 0x7fd57cc63610.type<class 'tfx.types.standard_artifacts.ExampleStatistics'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/StatisticsGen/statistics/2.span0.split_names[""train_data"", ""test_data""]"
['schema'],function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Channel of type 'Schema' (1 artifact) at 0x7fd50ccca820.type_nameSchema._artifacts[0] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'Schema' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/SchemaGen/schema/3) at 0x7fd56e487370.type<class 'tfx.types.standard_artifacts.Schema'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/SchemaGen/schema/3

0,1
.type_name,ExampleStatistics
._artifacts,"[0] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'ExampleStatistics' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/StatisticsGen/statistics/2) at 0x7fd57cc63610.type<class 'tfx.types.standard_artifacts.ExampleStatistics'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/StatisticsGen/statistics/2.span0.split_names[""train_data"", ""test_data""]"

0,1
[0],"function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'ExampleStatistics' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/StatisticsGen/statistics/2) at 0x7fd57cc63610.type<class 'tfx.types.standard_artifacts.ExampleStatistics'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/StatisticsGen/statistics/2.span0.split_names[""train_data"", ""test_data""]"

0,1
.type,<class 'tfx.types.standard_artifacts.ExampleStatistics'>
.uri,/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/StatisticsGen/statistics/2
.span,0
.split_names,"[""train_data"", ""test_data""]"

0,1
.type_name,Schema
._artifacts,[0] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'Schema' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/SchemaGen/schema/3) at 0x7fd56e487370.type<class 'tfx.types.standard_artifacts.Schema'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/SchemaGen/schema/3

0,1
[0],function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'Schema' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/SchemaGen/schema/3) at 0x7fd56e487370.type<class 'tfx.types.standard_artifacts.Schema'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/SchemaGen/schema/3

0,1
.type,<class 'tfx.types.standard_artifacts.Schema'>
.uri,/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/SchemaGen/schema/3

0,1
['anomalies'],"function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Channel of type 'ExampleAnomalies' (1 artifact) at 0x7fd50cd966a0.type_nameExampleAnomalies._artifacts[0] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'ExampleAnomalies' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/ExampleValidator.Data_Validation/anomalies/4) at 0x7fd50cd96670.type<class 'tfx.types.standard_artifacts.ExampleAnomalies'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/ExampleValidator.Data_Validation/anomalies/4.span0.split_names[""train_data"", ""test_data""]"

0,1
.type_name,ExampleAnomalies
._artifacts,"[0] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'ExampleAnomalies' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/ExampleValidator.Data_Validation/anomalies/4) at 0x7fd50cd96670.type<class 'tfx.types.standard_artifacts.ExampleAnomalies'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/ExampleValidator.Data_Validation/anomalies/4.span0.split_names[""train_data"", ""test_data""]"

0,1
[0],"function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'ExampleAnomalies' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/ExampleValidator.Data_Validation/anomalies/4) at 0x7fd50cd96670.type<class 'tfx.types.standard_artifacts.ExampleAnomalies'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/ExampleValidator.Data_Validation/anomalies/4.span0.split_names[""train_data"", ""test_data""]"

0,1
.type,<class 'tfx.types.standard_artifacts.ExampleAnomalies'>
.uri,/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/ExampleValidator.Data_Validation/anomalies/4
.span,0
.split_names,"[""train_data"", ""test_data""]"


In [19]:
train_uri = example_validator.outputs['anomalies'].get()[0].uri
train_anomalies_filename = os.path.join(train_uri, "train/anomalies.pbtxt")

In [20]:
train_anomalies_filename

'/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/ExampleValidator.Data_Validation/anomalies/4/train/anomalies.pbtxt'

In [21]:
context.show(example_validator.outputs['output'])

# Transform

In [22]:
TRANSFORM_MODULE = 'transform.py'
!cat {TRANSFORM_MODULE}
#!python transform.py

import tensorflow as tf
import tensorflow_transform as tft
import data_features

def _fill_in_missing(x):
  default_value = '' if x.dtype == tf.string else 0
  return tf.squeeze(tf.sparse.to_dense(tf.SparseTensor(x.indices, x.values, [x.dense_shape[0], 1]), default_value), axis=1)

def preprocessing_fn(inputs):
  outputs = {}

  # Scale numerical features.
  for key in data_features.NUMERIC_FEATURE_KEYS:
    outputs[data_features.transformed_feature_name(key)] = tft.scale_to_z_score(_fill_in_missing(inputs[key]))

  return outputs

In [23]:
transform = Transform(examples = example_gen.outputs['examples'],
                      schema = schema_gen.outputs['schema'],
                      module_file = TRANSFORM_MODULE)                      

In [24]:
example_gen.outputs['examples']

0,1
.type_name,Examples
._artifacts,"[0] function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'Examples' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/CsvExampleGen/examples/1) at 0x7fd57c178100.type<class 'tfx.types.standard_artifacts.Examples'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/CsvExampleGen/examples/1.span0.split_names[""train_data"", ""test_data""].version0"

0,1
[0],"function toggleTfxObject(element) {  var objElement = element.parentElement;  if (objElement.classList.contains('collapsed')) {  objElement.classList.remove('collapsed');  objElement.classList.add('expanded');  } else {  objElement.classList.add('collapsed');  objElement.classList.remove('expanded');  } } Artifact of type 'Examples' (uri: /Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/CsvExampleGen/examples/1) at 0x7fd57c178100.type<class 'tfx.types.standard_artifacts.Examples'>.uri/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/CsvExampleGen/examples/1.span0.split_names[""train_data"", ""test_data""].version0"

0,1
.type,<class 'tfx.types.standard_artifacts.Examples'>
.uri,/Users/CarlosMonsivais/Desktop/TFX_football_manager_2022/Artifacts/tfx-football-pipeline/20220123_154422/CsvExampleGen/examples/1
.span,0
.split_names,"[""train_data"", ""test_data""]"
.version,0


In [25]:
context.run(transform)

ValueError: Split does not exist over all example artifacts: train