/
hparams
1 lines (1 loc) · 1.77 KB
/
hparams
1
{"src": "req", "tgt": "rep", "train_prefix": "./data/initial/train", "dev_prefix": "./data/initial/test", "test_prefix": "./data/initial/test", "vocab_prefix": "./data/initial/vocab", "embed_prefix": null, "out_dir": "./data/initial/model", "num_units": 128, "num_layers": 4, "num_encoder_layers": 4, "num_decoder_layers": 4, "dropout": 0.2, "unit_type": "lstm", "encoder_type": "uni", "residual": false, "time_major": true, "num_embeddings_partitions": 0, "attention": "scaled_luong", "attention_architecture": "standard", "output_attention": true, "pass_hidden_state": true, "optimizer": "sgd", "num_train_steps": 2000, "batch_size": 128, "init_op": "uniform", "init_weight": 0.1, "max_gradient_norm": 5.0, "learning_rate": 1.0, "warmup_steps": 0, "warmup_scheme": "t2t", "decay_scheme": "", "colocate_gradients_with_ops": true, "num_buckets": 5, "max_train": 0, "src_max_len": 50, "tgt_max_len": 50, "src_max_len_infer": null, "tgt_max_len_infer": null, "infer_batch_size": 32, "beam_width": 0, "length_penalty_weight": 0.0, "sampling_temperature": 0.0, "num_translations_per_input": 1, "sos": "<s>", "eos": "</s>", "subword_option": "", "check_special_token": true, "forget_bias": 1.0, "num_gpus": 1, "epoch_step": 0, "steps_per_stats": 100, "steps_per_external_eval": null, "share_vocab": false, "metrics": ["bleu"], "log_device_placement": false, "random_seed": null, "override_loaded_hparams": false, "num_keep_ckpts": 5, "avg_ckpts": false, "num_intra_threads": 0, "num_inter_threads": 0, "num_encoder_residual_layers": 0, "num_decoder_residual_layers": 0, "src_vocab_size": 22, "tgt_vocab_size": 27, "src_vocab_file": "./data/initial/vocab.req", "tgt_vocab_file": "./data/initial/vocab.rep", "src_embed_file": "", "tgt_embed_file": "", "best_bleu": 100.0, "best_bleu_dir": "./data/initial/model/best_bleu"}