From fb411559b20e9bf55d759e6c390f4f13fac72677 Mon Sep 17 00:00:00 2001 From: Jonas Rothfuss Date: Tue, 28 Nov 2023 10:16:15 +0100 Subject: [PATCH 1/3] bugfix --- experiments/online_rl_hardware/online_rl_loop.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/experiments/online_rl_hardware/online_rl_loop.py b/experiments/online_rl_hardware/online_rl_loop.py index 94e9213..fdc55ce 100644 --- a/experiments/online_rl_hardware/online_rl_loop.py +++ b/experiments/online_rl_hardware/online_rl_loop.py @@ -332,7 +332,7 @@ def policy(x): parser.add_argument('--gpu', type=int, default=1) parser.add_argument('--prior', type=str, default='none_FVSGD') - parser.add_argument('--num_env_steps', type=int, default=200, info='number of steps in the environment per episode') + parser.add_argument('--num_env_steps', type=int, default=200, help='number of steps in the environment per episode') parser.add_argument('--reset_bnn', type=int, default=0) args = parser.parse_args() From 9dfdabb3b3163805cb460a5aff538faf827ed522 Mon Sep 17 00:00:00 2001 From: Jonas Rothfuss Date: Tue, 28 Nov 2023 10:27:19 +0100 Subject: [PATCH 2/3] bugfix in euler gpu cmd generation --- experiments/util.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/experiments/util.py b/experiments/util.py index be2be7e..1ddf645 100644 --- a/experiments/util.py +++ b/experiments/util.py @@ -149,7 +149,7 @@ def generate_run_commands(command_list: List[str], output_file_list: Optional[Li f'--cpus-per-task {num_cpus} ' if num_gpus > 0: - bsub_cmd += f'-G {num_gpus} --gres=gpumem:10240m' + bsub_cmd += f'-G {num_gpus} --gres=gpumem:10240m ' assert output_file_list is None or len(command_list) == len(output_file_list) if output_file_list is None: From 2de7794114bcbfecd892bc36224794046dad6d80 Mon Sep 17 00:00:00 2001 From: Jonas Rothfuss Date: Tue, 28 Nov 2023 13:52:55 +0100 Subject: [PATCH 3/3] update online_rl_hardware launcher --- experiments/online_rl_hardware/launcher.py | 7 +++---- 1 file changed, 3 insertions(+), 4 deletions(-) diff --git a/experiments/online_rl_hardware/launcher.py b/experiments/online_rl_hardware/launcher.py index 6d7a7f9..8fb0f9f 100644 --- a/experiments/online_rl_hardware/launcher.py +++ b/experiments/online_rl_hardware/launcher.py @@ -3,12 +3,11 @@ def main(args): _applicable_configs = { - 'prior': ['none_FVSGD', 'none_SVGD', 'high_fidelity', 'low_fidelity'], # 'high_fidelity_no_aditive_GP'], + 'prior': ['none_FVSGD', 'none_SVGD', 'high_fidelity', 'low_fidelity'], 'seed': list(range(5)), - 'run_remote': [0], + 'machine': ['local'], 'gpu': [1], - 'wandb_tag': ['gpu' if args.num_gpus > 0 else 'cpu'], - 'project_name': ['OnlineRLDebug3'], + 'project_name': ['OnlineRLDebug4'], } all_flags_combinations = dict_permutations(_applicable_configs)