{
  "training_data_path": "path/to/training_data",
  "eval_data_path": "path/to/eval/data",
  "state_norm_data_path": "path/to/norm_data",
  "model_output_path": "outputs/",
  "use_gpu": true,
  "use_all_avail_gpus": true,
  "num_nodes": 1,
  "init_method": "file:///tmp/dqn_example.lock",
  "norm_params": {
    "output_dir": "path/to/norm_data",
    "cols_to_norm": [
      "state_features"
    ],
    "num_samples": 10000,
    "skip_box_cox": false,
    "feature_overrides": {
      "0": "CONTINUOUS",
      "1": "CONTINUOUS",
      "2": "CONTINUOUS"
    }
  },
  "actions": [
    "3",
    "4",
    "5",
    "6",
    "7",
    "8",
    "9",
    "10",
    "11",
    "12",
    "13",
    "14",
    "15",
    "16",
    "17",
    "18",
    "19",
    "20",
    "21",
    "22",
    "23",
    "24",
    "25",
    "26",
    "27",
    "28",
    "29",
    "30",
    "31",
    "32",
    "33",
    "34",
    "35",
    "36",
    "37",
    "38",
    "39",
    "40",
    "41",
    "42",
    "43",
    "44",
    "45",
    "46",
    "47",
    "48",
    "49",
    "50",
    "51",
    "52",
    "53",
    "54",
    "55",
    "56",
    "57",
    "58",
    "59",
    "60",
    "61",
    "62",
    "63",
    "64",
    "65",
    "66",
    "67",
    "68",
    "69",
    "70",
    "71",
    "72",
    "73",
    "74",
    "75",
    "76",
    "77",
    "78",
    "79",
    "80",
    "81",
    "82",
    "83",
    "84",
    "85",
    "86",
    "87",
    "88",
    "89",
    "90",
    "91",
    "92",
    "93",
    "94",
    "95",
    "96",
    "97",
    "98",
    "99",
    "100",
    "101",
    "102"
  ],
  "epochs": 100,
  "rl": {
    "gamma": 0.99,
    "target_update_rate": 0.2,
    "maxq_learning": 1,
    "epsilon": 0.2,
    "temperature": 0.35,
    "softmax_policy": 0
  },
  "rainbow": {
    "double_q_learning": true,
    "dueling_architecture": false
  },
  "training": {
    "layers": [
      -1,
      128,
      64,
      -1
    ],
    "activations": [
      "relu",
      "relu",
      "linear"
    ],
    "minibatch_size": 256,
    "learning_rate": 0.001,
    "optimizer": "ADAM",
    "lr_decay": 0.999,
    "warm_start_model_path": null,
    "l2_decay": 0
  }
}