| hyperparams = dict( | |
| batch_size=128, | |
| exploration_rate=1, | |
| exploration_rate_decay=0.99999, | |
| exploration_rate_min=0.01, | |
| training_frequency=1, | |
| target_network_sync_frequency=20, | |
| max_memory_size=1000000, | |
| learning_rate=0.001, | |
| learning_starts=128, | |
| save_frequency=100000 | |
| ) | |