diff --git a/cleanrl/dqn.py b/cleanrl/dqn.py
index bb668164..2c9da757 100644
--- a/cleanrl/dqn.py
+++ b/cleanrl/dqn.py
@@ -70,7 +70,7 @@ def parse_args():
         help="the batch size of sample from the reply memory")
     parser.add_argument("--start-e", type=float, default=1,
         help="the starting epsilon for exploration")
-    parser.add_argument("--end-e", type=float, default=0,
+    parser.add_argument("--end-e", type=float, default=0.05,
         help="the ending epsilon for exploration")
     parser.add_argument("--exploration-fraction", type=float, default=0.5,
         help="the fraction of `total-timesteps` it takes from start-e to go end-e")