To run this notebook, you need to install TensorFlow 1.9.0 and the skip-thoughts package.

Please follow the steps below:

1. Create a new environment with Python 3.7.1 and install TensorFlow 1.9.0 in it.
2. Install the skip-thoughts package with 'pip install skip-thoughts'

After installation, you need to download and extract the pretrained skip-thoughts model archive (a `.tar.gz` file). Run the following commands to do so:

1. wget "http://download.tensorflow.org/models/skip_thoughts_bi_2017_02_16.tar.gz"

2. tar -xvf skip_thoughts_bi_2017_02_16.tar.gz

3. rm skip_thoughts_bi_2017_02_16.tar.gz

Once this process has completed, you can continue running the cells below. Update the file paths in the code below to match the locations of the files on your machine.

In [None]:
# importing all necessary packages
from __future__ import absolute_import
from __future__ import division
from __future__ import print_function
import numpy as np
import os.path
import FeatureGenerator
import pandas as pd

In [None]:
# Paths of the train and test CSV files handed to the FeatureGenerator calls.
train_dataset_loc, test_dataset_loc = (
    './Data/FinalTrainSet.csv',
    './Data/FinalTestSet.csv',
)

# Creating Neural Features for dataset

In [None]:
# Train Set
# Generate the neural features for the training CSV. The call returns two
# values: the features and `labels_done_train`.
neural_features_train, labels_done_train = FeatureGenerator.neural_features(train_dataset_loc)
print(len(labels_done_train))
# Fix: this line used to read `neural_features.train`, which raises NameError
# because no `neural_features` name exists; print the array's shape instead.
print(neural_features_train.shape)  # should be (len(labels_done_train),4800)

In [None]:
# Test Set
# Generate the neural features for the test CSV. The call returns two values:
# the features and `labels_done_test`.
neural_features_test, labels_done_test = FeatureGenerator.neural_features(test_dataset_loc)
print(len(labels_done_test))
# Fix: this line used to read `neural_features.test`, which raises NameError
# because no `neural_features` name exists; print the array's shape instead.
print(neural_features_test.shape)  # should be (len(labels_done_test),4800)

In [None]:
# Saving the neural features
# Write the neural features and the label arrays to .npy files under ./Data,
# features first, then labels (np.save takes the target file, then the array).
np.save('./Data/english_train_neural.npy', neural_features_train)
np.save('./Data/english_test_neural.npy', neural_features_test)
np.save('./Data/labels_done_train.npy', labels_done_train)
np.save('./Data/labels_done_test.npy', labels_done_test)

# Creating Statistical Features for dataset

In [None]:
# Train Set
# Build the statistical features for the training CSV, passing along the
# `labels_done_train` value obtained from the neural-feature step.
statistical_features_train = FeatureGenerator.statistical_features(
    dataset_loc=train_dataset_loc,
    labels_done=labels_done_train,
)
print(statistical_features_train.shape)  # should be (len(labels_done_train),10000)

In [None]:
# Test Set
# Build the statistical features for the test CSV, passing along the
# `labels_done_test` value obtained from the neural-feature step.
statistical_features_test = FeatureGenerator.statistical_features(
    dataset_loc=test_dataset_loc,
    labels_done=labels_done_test,
)
print(statistical_features_test.shape)  # should be (len(labels_done_test),10000)

In [None]:
# Saving the statistical features
# Write the train and test statistical features to .npy files under ./Data
# (np.save takes the target file, then the array).
np.save('./Data/english_train_statistical.npy', statistical_features_train)
np.save('./Data/english_test_statistical.npy', statistical_features_test)

# Creating External Features for dataset

In [None]:
# Train set
# Build the external features for the training CSV, passing along the
# `labels_done_train` value obtained from the neural-feature step.
external_features_train = FeatureGenerator.external_features(
    dataset_loc=train_dataset_loc,
    labels_done=labels_done_train,
)
print(external_features_train.shape)  # should be (len(labels_done_train),21)

In [None]:
# Test set
# Build the external features for the test CSV, passing along the
# `labels_done_test` value obtained from the neural-feature step.
external_features_test = FeatureGenerator.external_features(
    dataset_loc=test_dataset_loc,
    labels_done=labels_done_test,
)
print(external_features_test.shape)  # should be (len(labels_done_test),21)

In [None]:
# Saving external features
# Write the train and test external features to .npy files under ./Data
# (np.save takes the target file, then the array).
np.save('./Data/english_train_external.npy', external_features_train)
np.save('./Data/english_test_external.npy', external_features_test)