Code and LaTeX source for the paper "Generalization and Regularization in DQN".
The code used in all experiments can be found at JesseFarebro/dqn-ale. You can check out the code by cloning this repository with recursive submodules and following the instructions in the dqn-ale repository.
python3 main.py --rom {freeway.bin,hero.bin,space_invaders.bin,breakout.bin} \
--random_seed {0,1,2,3,4,5,6,7,8,9}
python3 main.py --rom {freeway.bin,hero.bin,space_invaders.bin,breakout.bin} \
--random_seed {0,1,2,3,4,5,6,7,8,9} \
--use_dropout \
--use_l2
python3 main.py --rom {freeway.bin,hero.bin,space_invaders.bin,breakout.bin} \
--random_seed {0,1,2,3,4,5,6,7,8,9} \
--evaluate \
--max_episode_count 100 \
--restore_dir {logdir,logdir_with_reg}
python3 main.py --rom {freeway.bin,hero.bin,space_invaders.bin,breakout.bin} \
--random_seed {0,1,2,3,4,5,6,7,8,9} \
--restore_dir {logdir,logdir_with_reg} \
--mode M --difficulty D
python3 main.py --rom {freeway.bin,hero.bin,space_invaders.bin,breakout.bin} \
--random_seed {0,1,2,3,4,5,6,7,8,9} \
--restore_dir {logdir,logdir_with_reg} \
--mode M --difficulty D \
--load_scope q/conv/
python3 main.py --rom {freeway.bin,hero.bin,space_invaders.bin,breakout.bin} \
--random_seed {0,1,2,3,4,5,6,7,8,9} \
--restore_dir {logdir,logdir_with_reg} \
--mode M --difficulty D \
--optimize_scope q/conv/
@article{Farebrother2018a,
author = {Jesse Farebrother and
Marlos C. Machado and
Michael Bowling},
title = {Generalization and Regularization in {DQN}},
journal = {CoRR},
volume = {abs/1810.00123},
year = {2018},
}