In [1]:
# Import Dependencies
import json
import numpy as np
from sklearn import datasets
from sklearn.model_selection import train_test_split

In [2]:
# Load the iris dataset through scikit-learn's datasets module
iris = datasets.load_iris()

# Feature matrix (X) and target vector (y) taken from the loaded dataset
X, y = iris.data, iris.target

# Peek at the feature values of the first observation
X[0]

array([5.1, 3.5, 1.4, 0.2])

In [3]:
# Shuffle and split into train/test subsets; the fixed random_state makes the
# split reproducible across runs.
X_train, X_test, y_train, y_test = train_test_split(
    X,
    y,
    shuffle=True,
    random_state=101,
)

In [4]:
# Show the number of training feature rows next to the number of training labels
len(X_train), len(y_train)

(112, 112)

In [5]:
# Show the number of test feature rows next to the number of test labels
len(X_test), len(y_test)

(38, 38)

In [6]:
# Build one record per training observation. Each feature row is paired with
# its label, and .item() turns the NumPy scalars into plain Python numbers so
# the records can be serialised with the json module.
data = {
    'data': [
        {
            "sepal_length": features[0].item(),
            "sepal_width": features[1].item(),
            "petal_length": features[2].item(),
            "petal_width": features[3].item(),
            "species": label.item(),
        }
        for features, label in zip(X_train, y_train)
    ]
}

In [7]:
# Display the whole training dictionary (one entry per record, so the output is long)
data

{'data': [{'sepal_length': 5.6,
   'sepal_width': 2.7,
   'petal_length': 4.2,
   'petal_width': 1.3,
   'species': 1},
  {'sepal_length': 7.7,
   'sepal_width': 3.0,
   'petal_length': 6.1,
   'petal_width': 2.3,
   'species': 2},
  {'sepal_length': 5.1,
   'sepal_width': 3.7,
   'petal_length': 1.5,
   'petal_width': 0.4,
   'species': 0},
  {'sepal_length': 4.6,
   'sepal_width': 3.6,
   'petal_length': 1.0,
   'petal_width': 0.2,
   'species': 0},
  {'sepal_length': 4.7,
   'sepal_width': 3.2,
   'petal_length': 1.6,
   'petal_width': 0.2,
   'species': 0},
  {'sepal_length': 6.7,
   'sepal_width': 3.0,
   'petal_length': 5.0,
   'petal_width': 1.7,
   'species': 1},
  {'sepal_length': 5.6,
   'sepal_width': 3.0,
   'petal_length': 4.5,
   'petal_width': 1.5,
   'species': 1},
  {'sepal_length': 4.3,
   'sepal_width': 3.0,
   'petal_length': 1.1,
   'petal_width': 0.1,
   'species': 0},
  {'sepal_length': 7.1,
   'sepal_width': 3.0,
   'petal_length': 5.9,
   'petal_width': 2.1,
  

In [8]:
# Inspect the first training record to confirm its keys and value types
data['data'][0]

{'sepal_length': 5.6,
 'sepal_width': 2.7,
 'petal_length': 4.2,
 'petal_width': 1.3,
 'species': 1}

In [9]:
# Write only the list of training records (not the wrapping dict) to disk as JSON
with open('training_data.json', 'w') as training_file:
    json.dump(data['data'], training_file)

In [10]:
# Build one record per test observation. Each feature row is paired with its
# label, and .item() turns the NumPy scalars into plain Python numbers so the
# records can be serialised with the json module.
test_data = {
    'data': [
        {
            "sepal_length": features[0].item(),
            "sepal_width": features[1].item(),
            "petal_length": features[2].item(),
            "petal_width": features[3].item(),
            "species": label.item(),
        }
        for features, label in zip(X_test, y_test)
    ]
}

In [11]:
# Display the whole test dictionary (one entry per record, so the output is long)
test_data

{'data': [{'sepal_length': 5.5,
   'sepal_width': 4.2,
   'petal_length': 1.4,
   'petal_width': 0.2,
   'species': 0},
  {'sepal_length': 5.4,
   'sepal_width': 3.9,
   'petal_length': 1.3,
   'petal_width': 0.4,
   'species': 0},
  {'sepal_length': 5.0,
   'sepal_width': 3.5,
   'petal_length': 1.6,
   'petal_width': 0.6,
   'species': 0},
  {'sepal_length': 7.2,
   'sepal_width': 3.0,
   'petal_length': 5.8,
   'petal_width': 1.6,
   'species': 2},
  {'sepal_length': 7.0,
   'sepal_width': 3.2,
   'petal_length': 4.7,
   'petal_width': 1.4,
   'species': 1},
  {'sepal_length': 6.3,
   'sepal_width': 2.7,
   'petal_length': 4.9,
   'petal_width': 1.8,
   'species': 2},
  {'sepal_length': 6.2,
   'sepal_width': 2.2,
   'petal_length': 4.5,
   'petal_width': 1.5,
   'species': 1},
  {'sepal_length': 5.5,
   'sepal_width': 2.3,
   'petal_length': 4.0,
   'petal_width': 1.3,
   'species': 1},
  {'sepal_length': 6.3,
   'sepal_width': 2.5,
   'petal_length': 5.0,
   'petal_width': 1.9,
  

In [12]:
# Write only the list of test records (not the wrapping dict) to disk as JSON
with open('test_data.json', 'w') as test_file:
    json.dump(test_data['data'], test_file)