# Training

```bash
# Fine-tune on the ARD task with training and evaluation enabled
# (--do_train / --do_eval).
#   BERT_BASE_DIR  directory that provides vocab.txt, bert_config.json and
#                  the bert_model.ckpt checkpoint used for initialisation.
#   GLUE_DIR       parent data directory; the ARD data is read from
#                  $GLUE_DIR/ARD.
export BERT_BASE_DIR=/home/ubuntu/bert_models/uncased_L-12_H-768_A-12
export GLUE_DIR=/home/ubuntu/glue_data

# Expansions are double-quoted so the command keeps working if either
# directory is changed to a path containing spaces or glob characters.
python run_classifier.py \
  --task_name=ARD \
  --do_train=true \
  --do_eval=true \
  --data_dir="$GLUE_DIR/ARD" \
  --vocab_file="$BERT_BASE_DIR/vocab.txt" \
  --bert_config_file="$BERT_BASE_DIR/bert_config.json" \
  --init_checkpoint="$BERT_BASE_DIR/bert_model.ckpt" \
  --max_seq_length=128 \
  --train_batch_size=32 \
  --learning_rate=2e-5 \
  --num_train_epochs=3.0 \
  --output_dir=/home/ubuntu/tmp/ard_output/
```

# Prediction

```sh
# Run prediction (--do_predict) on the ARD task with the fine-tuned model.
#   BERT_BASE_DIR       directory that provides vocab.txt and bert_config.json.
#   GLUE_DIR            parent data directory; the ARD data is read from
#                       $GLUE_DIR/ARD.
#   TRAINED_CLASSIFIER  passed as --init_checkpoint; set to the same
#                       directory that is used as --output_dir below.
export BERT_BASE_DIR=/home/ubuntu/bert_models/uncased_L-12_H-768_A-12
export GLUE_DIR=/home/ubuntu/glue_data
export TRAINED_CLASSIFIER=/home/ubuntu/tmp/ard_output

# Expansions are double-quoted so the command keeps working if any of the
# directories is changed to a path containing spaces or glob characters.
python run_classifier.py \
  --task_name=ARD \
  --do_predict=true \
  --data_dir="$GLUE_DIR/ARD" \
  --vocab_file="$BERT_BASE_DIR/vocab.txt" \
  --bert_config_file="$BERT_BASE_DIR/bert_config.json" \
  --init_checkpoint="$TRAINED_CLASSIFIER" \
  --max_seq_length=128 \
  --output_dir=/home/ubuntu/tmp/ard_output/
```

In [3]:
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
%matplotlib inline

  (fname, cnt))
  (fname, cnt))
  'Matplotlib is building the font cache using fc-list. '


In [8]:
test_predictions = pd.read_csv('/home/ubuntu/tmp/ard_output/test_results.tsv',delimiter='\t',header=None)

In [14]:
test_labels = pd.read_csv('/home/ubuntu/glue_data/ARD/test.tsv',delimiter='\t')

In [16]:
labels = test_labels.helpful_bin.values

In [38]:
from sklearn.metrics import accuracy_score, confusion_matrix, classification_report

In [33]:
accuracy = accuracy_score(y_pred=test_predictions.values.argmax(1),y_true=labels)

In [35]:
cmx = confusion_matrix(y_pred=test_predictions.values.argmax(1),y_true=labels)

In [40]:
print(classification_report(y_pred=test_predictions.values.argmax(1),y_true=labels))

              precision    recall  f1-score   support

           0       0.38      0.45      0.41       107
           1       0.21      0.13      0.16       113
           2       0.10      0.01      0.02        77
           3       0.06      0.02      0.03        60
           4       0.00      0.00      0.00        73
           5       0.00      0.00      0.00        91
           6       0.09      0.02      0.03       157
           7       0.10      0.02      0.04       421
           8       0.24      0.18      0.21       829
           9       0.50      0.88      0.64      1263

   micro avg       0.42      0.42      0.42      3191
   macro avg       0.17      0.17      0.15      3191
weighted avg       0.30      0.42      0.33      3191

