In [1]:
from misc.preferences import PREFERENCES
from misc.run_configuration import good_germeval_params, default_params, OutputLayerType
from misc.experimental_environment import Experiment
import time
from data.germeval2017 import germeval2017_dataset as dsl
import pprint
from misc import utils
import pandas as pd
import os

# Status labels (failure / success).
# NOTE(review): neither constant is referenced by the visible cells — confirm they are still needed.
STATUS_FAIL, STATUS_OK = 'fail', 'ok'

In [2]:
# Dataset/file settings for the run against the first test split
# (test_TIMESTAMP1.tsv). Every entry is forwarded unchanged as a keyword
# argument to PREFERENCES.defaults.
germeval_preferences = {
    'data_root': './data/data/germeval2017',
    'data_train': 'train_v1.4.tsv',
    'data_validation': 'dev_v1.4.tsv',
    'data_test': 'test_TIMESTAMP1.tsv',
    'source_index': 0,
    'target_vocab_index': 2,
    'file_format': 'csv',
    'language': 'de',
}
PREFERENCES.defaults(**germeval_preferences)

# Name passed as the first argument to every Experiment built in the visible cells.
main_experiment_name = 'GermEval-2017_Experiment'
# NOTE(review): not referenced by any visible cell — confirm whether it is still needed.
use_cuda = True

In [3]:
# `baseline` is an alias of good_germeval_params, not a copy. The visible cells
# only merge it into new dicts ({**baseline, ...}) and never mutate it.
baseline = good_germeval_params
# Pretty-print the parameter set to stdout with a 2-space nesting indent.
pprint.pprint(baseline, indent=2)

{ 'att_d_k': 60,
  'att_d_v': 60,
  'batch_size': 26,
  'clip_comments_to': 230,
  'dropout_rate': 0.3116352148277839,
  'early_stopping': 10,
  'embedding_dim': 300,
  'embedding_name': '6B',
  'embedding_type': 'fasttext',
  'language': 'de',
  'learning_rate_scheduler': { 'noam_learning_rate_factor': 1.120962889284992,
                               'noam_learning_rate_warmup': 6706},
  'learning_rate_scheduler_type': <LearningSchedulerType.Noam: 1>,
  'log_every_xth_iteration': -1,
  'model_size': 300,
  'num_encoder_blocks': 6,
  'num_epochs': 35,
  'num_heads': 5,
  'optimizer': { 'adam_beta1': 0.8278419040185792,
                 'adam_beta2': 0.7523040247084006,
                 'adam_eps': 0.001028230097476593,
                 'adam_weight_decay': 0.0001,
                 'learning_rate': 0.09624249687454951},
  'optimizer_type': <OptimizerType.Adam: 1>,
  'output_conv_kernel_size': 5,
  'output_conv_num_filters': 117,
  'output_conv_padding': 0,
  'output_conv_stride': 9,
  

In [4]:
def _experiment_entry(name, description, **run_config):
    """Build one experiment record.

    Args:
        name: Label printed in the banner before the experiment starts.
        description: Text passed to the Experiment constructor.
        **run_config: Overrides stored under 'rc'; the run cells merge them
            on top of the baseline parameters.

    Returns:
        dict with the keys 'name', 'description', 'loss', 'f1' and 'rc'.
    """
    return {
        'name': name,
        'description': description,
        # Initial values; the visible cells never update them.
        # NOTE(review): presumably placeholders for the best loss / f1 — confirm.
        'loss': 1000,
        'f1': -1,
        'rc': run_config,
    }


# Experiments executed by the run cells, in this order.
experiments = [
    _experiment_entry(
        'Baseline - LM-H',
        'Baseline classification for the GermEval-2017 task using the linear mean head',
        task='germeval',
    ),
    _experiment_entry(
        'Baseline - CNN-H',
        'Baseline classification for the GermEval-2017 task using the cnn head',
        task='germeval',
        output_layer_type=OutputLayerType.Convolutions,
    ),
    _experiment_entry(
        'Attributes',
        'Classification of only attributes',
        task='germeval_multitask',
    ),
]

In [5]:
# Record which repository revision produced the results below.
# The helper is called exactly once: the former bare call on its own line
# discarded the result (a non-final expression is not displayed by Jupyter),
# so it only repeated the lookup.
# NOTE(review): the recorded output reads "b'04962a6'", which looks like the
# repr of a bytes object — consider decoding inside utils.get_current_git_commit.
current_commit = utils.get_current_git_commit()
print('Current commit: ' + current_commit)

Current commit: b'04962a6'


In [6]:
# Run every configured experiment and keep each result.
#
# Changes compared to the previous version of this cell:
#   * the loop variable is no longer rebound to the Experiment instance
#     (it used to be the config dict at the top of the body and the
#     Experiment object at the bottom);
#   * each run's (dataframe, path) pair is stored in `experiment_results`
#     under the experiment name, instead of being overwritten by the next
#     iteration.
# `df` and `e_path` are still bound to the last completed run so the save
# cell below keeps working unchanged.
experiment_results = {}
for experiment_config in experiments:
    name = experiment_config['name']
    print(f'#########################################################################\n\nExperiment Name: {name}\n')
    print('#########################################################################\n\n')
    # Later entries win: baseline < fixed overrides < per-experiment run config.
    test_params = {
        **baseline,
        'num_epochs': 35,
        'language': 'de',
        **experiment_config['rc'],
    }
    experiment = Experiment(
        main_experiment_name,
        experiment_config['description'],
        default_params,
        test_params,
        dsl,
        runs=5,
    )
    df, e_path = experiment.run()
    experiment_results[name] = (df, e_path)



#########################################################################

Experiment Name: Baseline - LM-H

#########################################################################


Experiment GermEval-2017_Experiment initialized
Log path is  C:\Users\felix\OneDrive\Studium\Studium\6. Semester\MA\Project\ABSA-Transformer\logs\GermEval-2017_Experiment\20190501\0
Log path is  C:\Users\felix\OneDrive\Studium\Studium\6. Semester\MA\Project\ABSA-Transformer\logs\GermEval-2017_Experiment\20190501\1


#########################################################################
Name: GermEval-2017_Experiment
Description: Baseline classification for the GermEval-2017 task using the linear mean head
#########################################################################


+----------------------------------------------------------------------------------+
|                                 Hyperparameters                                  |
+------------------------------+-----------------------

                                          

+-------------------------+
|  GERM EVAL 2017 DATASET |
+---------------+---------+
|     Split     |   Size  |
+---------------+---------+
|     train     |  17043  |
|   validation  |   2049  |
|      test     |   2095  |
+---------------+---------+
+--------------------------------------+
|           Vocabulary Stats           |
+------------------------------+-------+
|          Vocabulary          |  Size |
+------------------------------+-------+
|              id              | 21187 |
|           comments           | 70418 |
|      general_sentiments      |   3   |
|      aspect_sentiments       |   4   |
|           padding            | 25733 |
|          Allgemein           |   4   |
|          Atmosphäre          |   4   |
| Auslastung_und_Platzangebot  |   4   |
|       Barrierefreiheit       |   4   |
|         Connectivity         |   4   |
|      DB_App_und_Website      |   4   |
|            Design            |   4   |
|   Gastronomisches_Angebot    |   4   |
|         


+-------------------------------------------------------------+
|                            Train                            |
+------------------------------+------+-------+-------+-------+
|           Category           | POS  |  NEG  |  NEU  |  Sum  |
+------------------------------+------+-------+-------+-------+
|          Allgemein           | 1102 |  2149 | 10043 | 13294 |
|           Zugfahrt           | 464  |  1813 |  173  |  2450 |
| Service_und_Kundenbetreuung  | 146  |  389  |   50  |  585  |
| Sonstige_Unregelmässigkeiten |  66  |  1936 |  107  |  2109 |
|          Sicherheit          |  21  |  903  |   15  |  939  |
|         Connectivity         |  75  |  240  |   67  |  382  |
|        Informationen         |  44  |  282  |   69  |  395  |
|          Atmosphäre          | 142  |  1165 |  223  |  1530 |
|          Ticketkauf          | 109  |  517  |  119  |  745  |
| Auslastung_und_Platzangebot  |  47  |  246  |   9   |  302  |
|   Komfort_und_Ausstattung    |  47  |


pre_training - DEBUG - train with cuda support
pre_training - INFO - 656 Iterations per epoch with batch size of 26
pre_training - INFO - Total iterations: 22960
pre_training - INFO - Total number of samples: 596960
pre_training - INFO - START training.


A Jupyter Widget

# EP	# IT	tr loss		val loss	f1		acc		duration / total time
1	17k	0.53		0.38		0.218		0.870		4.80m - 4.8m / 0.0m
2	34k	0.38		0.33		0.308		0.917		4.34m - 9.2m / 167.9m
3	51k	0.36		0.33		0.308		0.916		4.36m - 13.6m / 152.6m
4	68k	0.35		0.36		0.294		0.912		4.33m - 17.9m / 153.1m
5	85k	0.35		0.35		0.342		0.930		4.33m - 22.3m / 152.3m
6	102k	0.35		0.37		0.276		0.901		4.36m - 26.6m / 152.2m
7	119k	0.36		0.36		0.281		0.904		4.34m - 31.0m / 153.1m
8	136k	0.35		0.37		0.358		0.937		4.22m - 35.2m / 152.4m
9	154k	0.35		0.38		0.244		0.906		4.20m - 39.5m / 149.3m
10	171k	0.35		0.38		0.345		0.933		4.21m - 43.7m / 148.8m
11	188k	0.34		0.39		0.348		0.934		4.21m - 47.9m / 149.0m
12	205k	0.32		0.40		0.355		0.937		4.22m - 52.2m / 149.1m
13	222k	0.30		0.37		0.398		0.949		4.20m - 56.4m / 149.3m
14	239k	0.29		0.38		0.400		0.948		4.22m - 60.6m / 148.9m
15	256k	0.27		0.40		0.406		0.950		4.21m - 64.9m / 149.2m
16	273k	0.26		0.49		0.442		0.956		4.21m - 69.1m / 149.1m
17	290k	0.25		0.46		0.377		0.942		4.21m - 73.3m

                                          

+-------------------------+
|  GERM EVAL 2017 DATASET |
+---------------+---------+
|     Split     |   Size  |
+---------------+---------+
|     train     |  17043  |
|   validation  |   2049  |
|      test     |   2095  |
+---------------+---------+
+--------------------------------------+
|           Vocabulary Stats           |
+------------------------------+-------+
|          Vocabulary          |  Size |
+------------------------------+-------+
|              id              | 21187 |
|           comments           | 70418 |
|      general_sentiments      |   3   |
|      aspect_sentiments       |   4   |
|           padding            | 25733 |
|          Allgemein           |   4   |
|          Atmosphäre          |   4   |
| Auslastung_und_Platzangebot  |   4   |
|       Barrierefreiheit       |   4   |
|         Connectivity         |   4   |
|      DB_App_und_Website      |   4   |
|            Design            |   4   |
|   Gastronomisches_Angebot    |   4   |
|         


+-------------------------------------------------------------+
|                            Train                            |
+------------------------------+------+-------+-------+-------+
|           Category           | POS  |  NEG  |  NEU  |  Sum  |
+------------------------------+------+-------+-------+-------+
|          Allgemein           | 1102 |  2149 | 10043 | 13294 |
|           Zugfahrt           | 464  |  1813 |  173  |  2450 |
| Service_und_Kundenbetreuung  | 146  |  389  |   50  |  585  |
| Sonstige_Unregelmässigkeiten |  66  |  1936 |  107  |  2109 |
|          Sicherheit          |  21  |  903  |   15  |  939  |
|         Connectivity         |  75  |  240  |   67  |  382  |
|        Informationen         |  44  |  282  |   69  |  395  |
|          Atmosphäre          | 142  |  1165 |  223  |  1530 |
|          Ticketkauf          | 109  |  517  |  119  |  745  |
| Auslastung_und_Platzangebot  |  47  |  246  |   9   |  302  |
|   Komfort_und_Ausstattung    |  47  |


pre_training - DEBUG - train with cuda support
pre_training - INFO - 656 Iterations per epoch with batch size of 26
pre_training - INFO - Total iterations: 22960
pre_training - INFO - Total number of samples: 596960
pre_training - INFO - START training.


A Jupyter Widget

# EP	# IT	tr loss		val loss	f1		acc		duration / total time
1	17k	0.53		0.36		0.300		0.913		4.19m - 4.2m / 0.0m
2	34k	0.37		0.34		0.293		0.908		4.19m - 8.4m / 146.8m
3	51k	0.36		0.33		0.348		0.932		4.22m - 12.7m / 146.7m
4	68k	0.35		0.33		0.277		0.901		4.20m - 16.9m / 147.6m
5	85k	0.35		0.36		0.298		0.911		4.21m - 21.1m / 146.9m
6	102k	0.35		0.37		0.357		0.936		4.20m - 25.3m / 147.3m
7	119k	0.35		0.37		0.239		0.885		4.20m - 29.6m / 147.1m
8	136k	0.35		0.36		0.373		0.939		4.20m - 33.8m / 147.0m
9	154k	0.35		0.39		0.245		0.899		4.20m - 38.0m / 147.1m
10	171k	0.34		0.37		0.358		0.938		4.22m - 42.2m / 147.3m
11	188k	0.33		0.35		0.307		0.920		4.20m - 46.4m / 147.9m
12	205k	0.31		0.38		0.337		0.932		4.20m - 50.7m / 147.2m
13	222k	0.30		0.38		0.405		0.949		4.21m - 54.9m / 147.2m
14	239k	0.28		0.39		0.335		0.933		4.19m - 59.1m / 147.5m
15	256k	0.27		0.42		0.399		0.949		4.19m - 63.3m / 147.0m
16	273k	0.26		0.53		0.413		0.951		4.19m - 67.5m / 147.0m
17	290k	0.25		0.43		0.389		0.944		4.22m - 71.8m

                                          

+-------------------------+
|  GERM EVAL 2017 DATASET |
+---------------+---------+
|     Split     |   Size  |
+---------------+---------+
|     train     |  17043  |
|   validation  |   2049  |
|      test     |   2095  |
+---------------+---------+
+--------------------------------------+
|           Vocabulary Stats           |
+------------------------------+-------+
|          Vocabulary          |  Size |
+------------------------------+-------+
|              id              | 21187 |
|           comments           | 70418 |
|      general_sentiments      |   3   |
|      aspect_sentiments       |   4   |
|           padding            | 25733 |
|          Allgemein           |   4   |
|          Atmosphäre          |   4   |
| Auslastung_und_Platzangebot  |   4   |
|       Barrierefreiheit       |   4   |
|         Connectivity         |   4   |
|      DB_App_und_Website      |   4   |
|            Design            |   4   |
|   Gastronomisches_Angebot    |   4   |
|         


+-------------------------------------------------------------+
|                            Train                            |
+------------------------------+------+-------+-------+-------+
|           Category           | POS  |  NEG  |  NEU  |  Sum  |
+------------------------------+------+-------+-------+-------+
|          Allgemein           | 1102 |  2149 | 10043 | 13294 |
|           Zugfahrt           | 464  |  1813 |  173  |  2450 |
| Service_und_Kundenbetreuung  | 146  |  389  |   50  |  585  |
| Sonstige_Unregelmässigkeiten |  66  |  1936 |  107  |  2109 |
|          Sicherheit          |  21  |  903  |   15  |  939  |
|         Connectivity         |  75  |  240  |   67  |  382  |
|        Informationen         |  44  |  282  |   69  |  395  |
|          Atmosphäre          | 142  |  1165 |  223  |  1530 |
|          Ticketkauf          | 109  |  517  |  119  |  745  |
| Auslastung_und_Platzangebot  |  47  |  246  |   9   |  302  |
|   Komfort_und_Ausstattung    |  47  |


pre_training - DEBUG - train with cuda support
pre_training - INFO - 656 Iterations per epoch with batch size of 26
pre_training - INFO - Total iterations: 22960
pre_training - INFO - Total number of samples: 596960
pre_training - INFO - START training.


A Jupyter Widget

# EP	# IT	tr loss		val loss	f1		acc		duration / total time
1	17k	0.53		0.37		0.267		0.896		4.19m - 4.2m / 0.0m
2	34k	0.37		0.34		0.293		0.912		4.23m - 8.5m / 146.7m
3	51k	0.35		0.32		0.334		0.928		4.20m - 12.7m / 148.0m
4	68k	0.35		0.35		0.273		0.903		4.22m - 16.9m / 147.0m
5	85k	0.35		0.34		0.289		0.908		4.21m - 21.2m / 147.7m
6	102k	0.35		0.34		0.349		0.932		4.21m - 25.4m / 147.6m
7	119k	0.35		0.37		0.244		0.887		4.21m - 29.6m / 147.6m
8	136k	0.35		0.40		0.350		0.934		4.21m - 33.8m / 147.5m
9	154k	0.35		0.37		0.271		0.912		4.23m - 38.1m / 147.6m
10	171k	0.34		0.35		0.319		0.922		4.32m - 42.5m / 148.2m
11	188k	0.34		0.37		0.294		0.914		4.23m - 46.7m / 150.5m
12	205k	0.31		0.35		0.360		0.938		4.22m - 50.9m / 148.3m
13	222k	0.29		0.38		0.392		0.948		4.21m - 55.2m / 148.0m
14	239k	0.28		0.40		0.399		0.948		4.22m - 59.4m / 147.8m
15	256k	0.27		0.43		0.330		0.936		4.31m - 63.8m / 148.1m
16	273k	0.26		0.44		0.383		0.945		4.22m - 68.0m / 150.0m
17	290k	0.24		0.49		0.399		0.948		4.25m - 72.3m

                                          

+-------------------------+
|  GERM EVAL 2017 DATASET |
+---------------+---------+
|     Split     |   Size  |
+---------------+---------+
|     train     |  17043  |
|   validation  |   2049  |
|      test     |   2095  |
+---------------+---------+
+--------------------------------------+
|           Vocabulary Stats           |
+------------------------------+-------+
|          Vocabulary          |  Size |
+------------------------------+-------+
|              id              | 21187 |
|           comments           | 70418 |
|      general_sentiments      |   3   |
|      aspect_sentiments       |   4   |
|           padding            | 25733 |
|          Allgemein           |   4   |
|          Atmosphäre          |   4   |
| Auslastung_und_Platzangebot  |   4   |
|       Barrierefreiheit       |   4   |
|         Connectivity         |   4   |
|      DB_App_und_Website      |   4   |
|            Design            |   4   |
|   Gastronomisches_Angebot    |   4   |
|         


+-------------------------------------------------------------+
|                            Train                            |
+------------------------------+------+-------+-------+-------+
|           Category           | POS  |  NEG  |  NEU  |  Sum  |
+------------------------------+------+-------+-------+-------+
|          Allgemein           | 1102 |  2149 | 10043 | 13294 |
|           Zugfahrt           | 464  |  1813 |  173  |  2450 |
| Service_und_Kundenbetreuung  | 146  |  389  |   50  |  585  |
| Sonstige_Unregelmässigkeiten |  66  |  1936 |  107  |  2109 |
|          Sicherheit          |  21  |  903  |   15  |  939  |
|         Connectivity         |  75  |  240  |   67  |  382  |
|        Informationen         |  44  |  282  |   69  |  395  |
|          Atmosphäre          | 142  |  1165 |  223  |  1530 |
|          Ticketkauf          | 109  |  517  |  119  |  745  |
| Auslastung_und_Platzangebot  |  47  |  246  |   9   |  302  |
|   Komfort_und_Ausstattung    |  47  |


pre_training - DEBUG - train with cuda support
pre_training - INFO - 656 Iterations per epoch with batch size of 26
pre_training - INFO - Total iterations: 22960
pre_training - INFO - Total number of samples: 596960
pre_training - INFO - START training.


A Jupyter Widget

# EP	# IT	tr loss		val loss	f1		acc		duration / total time
1	17k	0.52		0.36		0.260		0.893		4.38m - 4.4m / 0.0m
2	34k	0.38		0.35		0.300		0.914		4.36m - 8.8m / 153.4m
3	51k	0.36		0.33		0.307		0.917		4.50m - 13.3m / 152.6m
4	68k	0.35		0.35		0.260		0.894		4.44m - 17.8m / 157.3m
5	85k	0.35		0.34		0.301		0.913		4.43m - 22.2m / 155.4m
6	102k	0.35		0.38		0.335		0.926		4.39m - 26.6m / 155.2m
7	119k	0.36		0.37		0.251		0.891		4.34m - 31.0m / 154.0m
8	136k	0.35		0.40		0.294		0.917		4.36m - 35.4m / 152.7m
9	154k	0.35		0.37		0.265		0.908		4.36m - 39.8m / 153.2m
10	171k	0.35		0.35		0.338		0.932		4.32m - 44.1m / 153.1m
11	188k	0.34		0.36		0.300		0.913		4.32m - 48.5m / 152.1m
12	205k	0.33		0.35		0.369		0.939		4.31m - 52.8m / 152.1m
13	222k	0.31		0.36		0.371		0.941		4.31m - 57.1m / 151.9m
14	239k	0.29		0.40		0.360		0.938		4.31m - 61.5m / 152.0m
15	256k	0.28		0.45		0.348		0.935		4.33m - 65.8m / 152.0m
16	273k	0.27		0.44		0.416		0.951		4.31m - 70.1m / 152.4m
17	290k	0.25		0.41		0.410		0.950		4.32m - 74.5m

                                          

+-------------------------+
|  GERM EVAL 2017 DATASET |
+---------------+---------+
|     Split     |   Size  |
+---------------+---------+
|     train     |  17043  |
|   validation  |   2049  |
|      test     |   2095  |
+---------------+---------+
+--------------------------------------+
|           Vocabulary Stats           |
+------------------------------+-------+
|          Vocabulary          |  Size |
+------------------------------+-------+
|              id              | 21187 |
|           comments           | 70418 |
|      general_sentiments      |   3   |
|      aspect_sentiments       |   4   |
|           padding            | 25733 |
|          Allgemein           |   4   |
|          Atmosphäre          |   4   |
| Auslastung_und_Platzangebot  |   4   |
|       Barrierefreiheit       |   4   |
|         Connectivity         |   4   |
|      DB_App_und_Website      |   4   |
|            Design            |   4   |
|   Gastronomisches_Angebot    |   4   |
|         


+-------------------------------------------------------------+
|                            Train                            |
+------------------------------+------+-------+-------+-------+
|           Category           | POS  |  NEG  |  NEU  |  Sum  |
+------------------------------+------+-------+-------+-------+
|          Allgemein           | 1102 |  2149 | 10043 | 13294 |
|           Zugfahrt           | 464  |  1813 |  173  |  2450 |
| Service_und_Kundenbetreuung  | 146  |  389  |   50  |  585  |
| Sonstige_Unregelmässigkeiten |  66  |  1936 |  107  |  2109 |
|          Sicherheit          |  21  |  903  |   15  |  939  |
|         Connectivity         |  75  |  240  |   67  |  382  |
|        Informationen         |  44  |  282  |   69  |  395  |
|          Atmosphäre          | 142  |  1165 |  223  |  1530 |
|          Ticketkauf          | 109  |  517  |  119  |  745  |
| Auslastung_und_Platzangebot  |  47  |  246  |   9   |  302  |
|   Komfort_und_Ausstattung    |  47  |


pre_training - DEBUG - train with cuda support
pre_training - INFO - 656 Iterations per epoch with batch size of 26
pre_training - INFO - Total iterations: 22960
pre_training - INFO - Total number of samples: 596960
pre_training - INFO - START training.


A Jupyter Widget

# EP	# IT	tr loss		val loss	f1		acc		duration / total time
1	17k	0.50		0.36		0.301		0.914		4.21m - 4.2m / 0.0m
2	34k	0.37		0.35		0.284		0.908		4.22m - 8.5m / 147.4m
3	51k	0.36		0.33		0.337		0.928		4.22m - 12.7m / 147.9m
4	68k	0.35		0.35		0.232		0.890		4.22m - 17.0m / 147.8m
5	85k	0.35		0.34		0.299		0.913		4.22m - 21.2m / 147.7m
6	102k	0.35		0.34		0.293		0.911		4.23m - 25.4m / 147.9m
7	119k	0.35		0.39		0.222		0.871		4.33m - 29.8m / 148.1m
8	136k	0.35		0.38		0.320		0.926		4.25m - 34.0m / 151.1m
9	154k	0.35		0.37		0.303		0.921		4.40m - 38.5m / 148.8m
10	171k	0.35		0.36		0.343		0.934		4.24m - 42.7m / 152.9m
11	188k	0.34		0.36		0.284		0.910		4.33m - 47.1m / 148.7m
12	205k	0.32		0.34		0.355		0.937		4.34m - 51.4m / 151.1m
13	222k	0.30		0.38		0.406		0.950		4.32m - 55.8m / 151.3m
14	239k	0.29		0.39		0.364		0.938		4.34m - 60.2m / 150.8m
15	256k	0.28		0.39		0.344		0.935		4.47m - 64.6m / 151.4m
16	273k	0.26		0.46		0.380		0.944		4.41m - 69.1m / 154.0m
17	290k	0.25		0.42		0.416		0.951		4.77m - 73.9m

+------------------------------+---------------------------------------------------+


                                          

+-------------------------+
|  GERM EVAL 2017 DATASET |
+---------------+---------+
|     Split     |   Size  |
+---------------+---------+
|     train     |  17043  |
|   validation  |   2049  |
|      test     |   2095  |
+---------------+---------+
+--------------------------------------+
|           Vocabulary Stats           |
+------------------------------+-------+
|          Vocabulary          |  Size |
+------------------------------+-------+
|              id              | 21187 |
|           comments           | 70418 |
|      general_sentiments      |   3   |
|      aspect_sentiments       |   4   |
|           padding            | 25733 |
|          Allgemein           |   4   |
|          Atmosphäre          |   4   |
| Auslastung_und_Platzangebot  |   4   |
|       Barrierefreiheit       |   4   |
|         Connectivity         |   4   |
|      DB_App_und_Website      |   4   |
|            Design            |   4   |
|   Gastronomisches_Angebot    |   4   |
|         


+-------------------------------------------------------------+
|                            Train                            |
+------------------------------+------+-------+-------+-------+
|           Category           | POS  |  NEG  |  NEU  |  Sum  |
+------------------------------+------+-------+-------+-------+
|          Allgemein           | 1102 |  2149 | 10043 | 13294 |
|           Zugfahrt           | 464  |  1813 |  173  |  2450 |
| Service_und_Kundenbetreuung  | 146  |  389  |   50  |  585  |
| Sonstige_Unregelmässigkeiten |  66  |  1936 |  107  |  2109 |
|          Sicherheit          |  21  |  903  |   15  |  939  |
|         Connectivity         |  75  |  240  |   67  |  382  |
|        Informationen         |  44  |  282  |   69  |  395  |
|          Atmosphäre          | 142  |  1165 |  223  |  1530 |
|          Ticketkauf          | 109  |  517  |  119  |  745  |
| Auslastung_und_Platzangebot  |  47  |  246  |   9   |  302  |
|   Komfort_und_Ausstattung    |  47  |


pre_training - DEBUG - train with cuda support
pre_training - INFO - 656 Iterations per epoch with batch size of 26
pre_training - INFO - Total iterations: 22960
pre_training - INFO - Total number of samples: 596960
pre_training - INFO - START training.


A Jupyter Widget

# EP	# IT	tr loss		val loss	f1		acc		duration / total time
1	17k	0.48		0.41		0.253		0.893		6.73m - 6.7m / 0.0m
2	34k	0.44		0.44		0.145		0.843		6.85m - 13.6m / 235.5m
3	51k	0.50		0.59		0.130		0.738		6.81m - 20.4m / 239.6m


KeyboardInterrupt: 

In [None]:
# Write the dataframe from the most recent Experiment.run() call to
# 'exp_df.pkl' inside the path that the same call returned.
# NOTE(review): assumes `df` is a pandas DataFrame (it is only used via .to_pickle) — confirm.
exp_df_path = os.path.join(e_path, 'exp_df.pkl')
print(f'Save dataframe of experiment to {exp_df_path}')
df.to_pickle(exp_df_path)

# Test set 2

In [5]:
# Same dataset settings as for the first test split; only 'data_test' differs
# (test_TIMESTAMP2.tsv).
# NOTE(review): if PREFERENCES.defaults only fills values that are not set yet,
# running this after the TIMESTAMP1 cell in the same kernel would not switch
# the test file — confirm the override semantics.
test_set_2_preferences = dict(
    data_root='./data/data/germeval2017',
    data_train='train_v1.4.tsv',
    data_validation='dev_v1.4.tsv',
    data_test='test_TIMESTAMP2.tsv',
    source_index=0,
    target_vocab_index=2,
    file_format='csv',
    language='de',
)
PREFERENCES.defaults(**test_set_2_preferences)

In [9]:
# Re-run only the first configured experiment against the second test split.
# The config dict and the Experiment instance now have separate names; the
# loop variable used to be rebound to the Experiment object inside the body.
# `df` and `e_path` remain bound to the result of the run.
for experiment_config in [experiments[0]]:
    name = experiment_config['name']
    print(f'#########################################################################\n\nExperiment Name: {name}\n')
    print('#########################################################################\n\n')
    # Later entries win: baseline < fixed overrides < per-experiment run config.
    test_params = {
        **baseline,
        'num_epochs': 35,
        'language': 'de',
        **experiment_config['rc'],
    }
    experiment = Experiment(
        main_experiment_name,
        experiment_config['description'],
        default_params,
        test_params,
        dsl,
        runs=5,
    )
    df, e_path = experiment.run()

#########################################################################

Experiment Name: Baseline - LM-H

#########################################################################


Experiment GermEval-2017_Experiment initialized
Log path is  C:\Users\felix\OneDrive\Studium\Studium\6. Semester\MA\Project\ABSA-Transformer\logs\GermEval-2017_Experiment\20190501\12
Log path is  C:\Users\felix\OneDrive\Studium\Studium\6. Semester\MA\Project\ABSA-Transformer\logs\GermEval-2017_Experiment\20190501\13


#########################################################################
Name: GermEval-2017_Experiment
Description: Baseline classification for the GermEval-2017 task using the linear mean head
#########################################################################


+----------------------------------------------------------------------------------+
|                                 Hyperparameters                                  |
+------------------------------+---------------------


Load train_v: 0it [00:00, ?it/s]
Load train_v: 370it [00:00, 3699.30it/s]
Load train_v: 787it [00:00, 3828.95it/s]
Load train_v: 1302it [00:00, 4128.55it/s]
Load train_v: 1686it [00:00, 4024.87it/s]
Load train_v: 2151it [00:00, 4194.01it/s]
Load train_v: 2621it [00:00, 4322.03it/s]
Load train_v: 3158it [00:00, 4590.45it/s]
Load train_v: 3595it [00:00, 4466.97it/s]
Load train_v: 4044it [00:00, 4407.55it/s]
Load train_v: 4525it [00:01, 4373.02it/s]
Load train_v: 4989it [00:01, 4437.07it/s]
Load train_v: 5473it [00:01, 4537.95it/s]
Load train_v: 5974it [00:01, 4657.03it/s]
Load train_v: 6456it [00:01, 4691.37it/s]
Load train_v: 6925it [00:01, 4387.65it/s]
Load train_v: 7389it [00:01, 4409.61it/s]
Load train_v: 7833it [00:01, 4217.20it/s]
Load train_v: 8260it [00:01, 4207.91it/s]
Load train_v: 8762it [00:01, 4410.90it/s]
Load train_v: 9374it [00:02, 4803.26it/s]
Load train_v: 9868it [00:02, 4759.48it/s]
Load train_v: 10372it [00:02, 4839.87it/s]
Load train_v: 10863it [00:02, 4720.93it/s]


+-------------------------+
|  GERM EVAL 2017 DATASET |
+---------------+---------+
|     Split     |   Size  |
+---------------+---------+
|     train     |  17043  |
|   validation  |   2049  |
|      test     |   1547  |
+---------------+---------+
+--------------------------------------+
|           Vocabulary Stats           |
+------------------------------+-------+
|          Vocabulary          |  Size |
+------------------------------+-------+
|              id              | 20639 |
|           comments           | 69247 |
|      general_sentiments      |   3   |
|      aspect_sentiments       |   4   |
|           padding            | 22936 |
|          Allgemein           |   4   |
|          Atmosphäre          |   4   |
| Auslastung_und_Platzangebot  |   4   |
|       Barrierefreiheit       |   4   |
|         Connectivity         |   4   |
|      DB_App_und_Website      |   4   |
|            Design            |   4   |
|   Gastronomisches_Angebot    |   4   |
|         


+-------------------------------------------------------------+
|                            Train                            |
+------------------------------+------+-------+-------+-------+
|           Category           | POS  |  NEG  |  NEU  |  Sum  |
+------------------------------+------+-------+-------+-------+
|          Allgemein           | 1102 |  2149 | 10043 | 13294 |
|           Zugfahrt           | 464  |  1813 |  173  |  2450 |
| Service_und_Kundenbetreuung  | 146  |  389  |   50  |  585  |
| Sonstige_Unregelmässigkeiten |  66  |  1936 |  107  |  2109 |
|          Sicherheit          |  21  |  903  |   15  |  939  |
|         Connectivity         |  75  |  240  |   67  |  382  |
|        Informationen         |  44  |  282  |   69  |  395  |
|          Atmosphäre          | 142  |  1165 |  223  |  1530 |
|          Ticketkauf          | 109  |  517  |  119  |  745  |
| Auslastung_und_Platzangebot  |  47  |  246  |   9   |  302  |
|   Komfort_und_Ausstattung    |  47  |


pre_training - DEBUG - train with cuda support
pre_training - INFO - 656 Iterations per epoch with batch size of 26
pre_training - INFO - Total iterations: 22960
pre_training - INFO - Total number of samples: 596960
pre_training - INFO - START training.


A Jupyter Widget

                                          

# EP	# IT	tr loss		val loss	f1		acc		duration / total time


                                          

1	17k	0.53		0.39		0.337		0.931		4.61m - 4.6m / 0.0m


                                          

2	34k	0.38		0.36		0.255		0.894		4.64m - 9.4m / 161.6m


                                          

3	51k	0.35		0.36		0.293		0.911		4.61m - 14.0m / 162.4m


                                          

4	68k	0.35		0.36		0.235		0.889		4.62m - 18.6m / 161.4m


                                          

5	85k	0.35		0.36		0.276		0.901		4.62m - 23.2m / 161.8m


                                          

6	102k	0.35		0.37		0.295		0.913		4.61m - 27.9m / 161.9m


                                          

7	119k	0.35		0.35		0.347		0.930		4.59m - 32.5m / 161.6m


                                          

8	136k	0.35		0.35		0.290		0.911		4.59m - 37.1m / 161.0m


                                          

9	154k	0.35		0.36		0.297		0.914		4.59m - 41.7m / 161.0m


                                          

10	171k	0.34		0.45		0.386		0.950		4.58m - 46.3m / 161.0m


                                          

11	188k	0.34		0.35		0.407		0.953		4.60m - 50.9m / 160.8m


                                          

12	205k	0.32		0.47		0.395		0.949		4.58m - 55.5m / 161.4m


                                            

13	222k	0.30		0.38		0.363		0.937		4.59m - 60.1m / 161.0m


                                            

14	239k	0.28		0.43		0.356		0.936		4.59m - 64.7m / 161.2m


                                            

15	256k	0.27		0.40		0.389		0.947		4.59m - 69.3m / 161.2m


                                            

16	273k	0.26		0.46		0.420		0.952		4.59m - 73.9m / 161.1m


                                            

17	290k	0.25		0.51		0.441		0.955		4.58m - 78.6m / 161.1m


                                            

18	307k	0.24		0.44		0.397		0.947		4.60m - 83.3m / 161.2m


                                            

19	324k	0.23		0.46		0.411		0.951		4.59m - 87.8m / 161.4m


                                            

20	341k	0.22		0.57		0.416		0.955		4.58m - 92.4m / 161.2m


                                            

21	358k	0.22		0.69		0.406		0.951		4.58m - 97.0m / 161.1m


                                            

22	375k	0.21		0.69		0.431		0.957		4.58m - 101.6m / 161.2m


                                            

23	392k	0.20		0.65		0.432		0.956		4.58m - 106.2m / 161.2m


                                            

24	409k	0.20		0.58		0.426		0.957		4.59m - 110.8m / 161.2m


                                            

25	426k	0.19		0.75		0.467		0.962		4.59m - 115.4m / 161.3m


                                            

26	443k	0.19		0.68		0.448		0.959		4.58m - 120.0m / 161.3m


                                            

27	461k	0.18		0.64		0.419		0.954		4.58m - 124.6m / 161.3m


                                            

28	478k	0.18		0.62		0.425		0.956		4.57m - 129.2m / 161.3m


                                            

29	495k	0.17		0.60		0.421		0.955		4.58m - 133.8m / 161.2m


                                            

30	512k	0.17		0.58		0.403		0.950		4.58m - 138.4m / 161.3m


                                            

31	529k	0.16		0.50		0.397		0.949		4.58m - 143.0m / 161.3m


                                            

32	546k	0.16		0.59		0.439		0.958		4.58m - 147.6m / 161.3m


                                            

33	563k	0.16		0.60		0.412		0.954		4.58m - 152.2m / 161.3m


                                            

34	580k	0.16		0.55		0.412		0.953		4.58m - 156.8m / 161.3m


                                            

35	597k	0.15		0.64		0.459		0.962		4.58m - 161.4m / 161.4m


Load train_v: 13626it [2:49:11, 4287.69it/s]

Training duration was 9685.623672962189
pre_training - DEBUG - --- Valid Scores ---
pre_training - INFO - TEST MACRO mean f1: 0.11126918130285399
VAL f1	0.46694711538461536 - (0.46694711538461536)
(macro) f1	{'valid': 0.14882394133828408, 'test': 0.11126918130285399}
VAL loss	0.3490273736584152
.---.
 /     \
 \.@-@./		Experiment: [0/1]
 /`\_/`\		Status: ok
 //  _  \\	Loss: 0.3490273736584152
 | \     )|_	f1: 0.46694711538461536
 /`\_`>  <_/ \
 \__/'---'\__/

#################################################################################
############################## EXPERIMENT COMPLETE ##############################


Run [0/1]: 0.4133184523809524
------------------------------
Mean: 0.4133184523809524
TEST MICRO F1 Statistics
count    1.000000
mean     0.413318
std           NaN
min      0.413318
25%      0.413318
50%      0.413318
75%      0.413318
max      0.413318
Name: test_f1, dtype: float64
TEST MACRO F1 Statistics
count    1.000000
mean     0.111269
std           NaN
min   