From 1d3722d767817642ac222a5cccec32715720d9f1 Mon Sep 17 00:00:00 2001 From: Patrick Virie Date: Tue, 14 Jan 2025 11:23:28 +0700 Subject: [PATCH] adjust epsilon --- tasks/rl_hopper.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/tasks/rl_hopper.py b/tasks/rl_hopper.py index 5d5f195..1c00343 100644 --- a/tasks/rl_hopper.py +++ b/tasks/rl_hopper.py @@ -162,7 +162,7 @@ def setup(): def train(context, parameter_path): course = context.course - num_courses = 2 + num_courses = 3 if course >= num_courses: logging.info("Experiment already completed") @@ -285,7 +285,7 @@ def prepare_data_tuples(states, actions, rewards, num_layers, skip_steps): total_steps = 0 num_trials = 2000 print_steps = max(1, num_trials // 100) - epsilon = 0.8 - 0.7 * (course + 1) / num_courses + epsilon = 0.8 - 0.6 * (course + 1) / num_courses course_statistics = {}