In [None]:
# normalize

from pandas import Series
from sklearn.preprocessing import MinMaxScaler

# define contrived series: ten evenly spaced values from 10 to 100
data = [10.0, 20.0, 30.0, 40.0, 50.0, 60.0, 70.0, 80.0, 90.0, 100.0]
series = Series(data)
print(series)

# prepare data for normalization: reshape the 1-D values into a single
# column of shape (n_samples, 1) before handing them to the scaler
values = series.values
values = values.reshape((len(values), 1))

# train the normalization (learns the min and max of the single column)
scaler = MinMaxScaler(feature_range=(0, 1))
scaler = scaler.fit(values)
# data_min_ / data_max_ hold one entry per feature column; pick the single
# feature explicitly rather than relying on implicit conversion of a
# one-element array to a scalar, which NumPy has deprecated
print('Min: %f, Max: %f' % (scaler.data_min_[0], scaler.data_max_[0]))

# normalize the dataset and print
normalized = scaler.transform(values)
print(normalized)

# inverse transform and print (should reproduce the original values)
inversed = scaler.inverse_transform(normalized)
print(inversed)

In [None]:
# one-hot encode

from numpy import array
from numpy import argmax
from sklearn.preprocessing import LabelEncoder
from sklearn.preprocessing import OneHotEncoder

# define example: a small categorical sequence with three distinct labels
data = ['cold', 'cold', 'warm', 'cold', 'hot', 'hot', 'warm', 'cold', 'warm', 'hot']
values = array(data)
print(values)

# integer encode: map each distinct label to an integer code
label_encoder = LabelEncoder()
integer_encoded = label_encoder.fit_transform(values)
print(integer_encoded)

# binary encode
# The `sparse` keyword was renamed to `sparse_output` in newer scikit-learn
# releases and later removed, so passing it fails on current versions.
# Leaving the encoder at its default (sparse) output and converting with
# .toarray() yields the same dense array on both old and new versions.
onehot_encoder = OneHotEncoder(categories='auto')
# the encoder expects one column per feature, so reshape to (n_samples, 1)
integer_encoded = integer_encoded.reshape(len(integer_encoded), 1)
onehot_encoded = onehot_encoder.fit_transform(integer_encoded).toarray()
print(onehot_encoded)

# invert first example: the position of the 1 in the first row is the
# integer code, which the label encoder maps back to the original label
inverted = label_encoder.inverse_transform([argmax(onehot_encoded[0, :])])
print(inverted)

In [None]:
# post seq padding

from keras.preprocessing.sequence import pad_sequences

# three integer sequences of different lengths (4, 3 and 1)
sequences = [[1, 2, 3, 4], [1, 2, 3], [1]]

# pad every sequence to the length of the longest one,
# appending the fill value at the END of the shorter sequences
padded = pad_sequences(sequences, padding='post')
print(padded)

In [None]:
# post seq truncating

from keras.preprocessing.sequence import pad_sequences

# three integer sequences of different lengths (4, 3 and 1)
sequences = [[1, 2, 3, 4], [1, 2, 3], [1]]

# cap every sequence at two items, dropping values from the END of the
# longer sequences; padding is left at the function's default
truncated = pad_sequences(sequences, truncating='post', maxlen=2)
print(truncated)

In [None]:
# pre seq padding

from keras.preprocessing.sequence import pad_sequences

# three integer sequences of different lengths (4, 3 and 1)
sequences = [[1, 2, 3, 4], [1, 2, 3], [1]]

# pad every sequence to the length of the longest one, inserting the fill
# value at the START of the shorter sequences ('pre' is the documented
# default, spelled out here for clarity)
padded = pad_sequences(sequences, padding='pre')
print(padded)

In [None]:
# pre seq truncating

from keras.preprocessing.sequence import pad_sequences

# three integer sequences of different lengths (4, 3 and 1)
sequences = [[1, 2, 3, 4], [1, 2, 3], [1]]

# cap every sequence at two items, dropping values from the START of the
# longer sequences ('pre' is the documented default, spelled out here)
truncated = pad_sequences(sequences, maxlen=2, truncating='pre')
print(truncated)

In [None]:
# shift backward

from pandas import DataFrame

# build a one-column frame holding the sequence 0..9 under the name 't'
df = DataFrame({'t': list(range(10))})

# shift backward: a negative period pulls each value up one row, so row i
# of 't+1' holds the value from row i+1 of 't'; the last row becomes NaN
df['t+1'] = df['t'].shift(periods=-1)
print(df)

In [None]:
# shift forward

from pandas import DataFrame

# build a one-column frame holding the sequence 0..9 under the name 't'
df = DataFrame({'t': list(range(10))})

# shift forward: a positive period pushes each value down one row, so row i
# of 't-1' holds the value from row i-1 of 't'; the first row becomes NaN
df['t-1'] = df['t'].shift(periods=1)
print(df)

In [None]:
# shift sequence

from pandas import DataFrame

# build a one-column frame holding the sequence 0..9 under the name 't'
df = DataFrame({'t': list(range(10))})
print(df)

In [None]:
# standardize

from pandas import Series
from sklearn.preprocessing import StandardScaler
from math import sqrt

# define contrived series
data = [1.0, 5.5, 9.0, 2.6, 8.8, 3.0, 4.1, 7.9, 6.3]
series = Series(data)
print(series)

# prepare data for standardization: reshape the 1-D values into a single
# column of shape (n_samples, 1) before handing them to the scaler
values = series.values
values = values.reshape((len(values), 1))

# train the standardization (learns the mean and variance of the column)
scaler = StandardScaler()
scaler = scaler.fit(values)
# mean_ / var_ hold one entry per feature column; pick the single feature
# explicitly rather than relying on implicit conversion of a one-element
# array to a scalar (in both '%f' and math.sqrt), which NumPy has deprecated
print('Mean: %f, StandardDeviation: %f' % (scaler.mean_[0], sqrt(scaler.var_[0])))

# standardize the dataset and print
standardized = scaler.transform(values)
print(standardized)

# inverse transform and print (should reproduce the original values)
inversed = scaler.inverse_transform(standardized)
print(inversed)