From cae7a6271ef86fcaf7c169aefe2cc0b996d7d5bc Mon Sep 17 00:00:00 2001 From: alik-git Date: Wed, 20 Nov 2024 20:21:20 +0000 Subject: [PATCH 1/6] add cmd arg for h5 output path with sensible default --- sim/h5_logger.py | 13 +++++++++++-- sim/sim2sim.py | 11 ++++++++++- 2 files changed, 21 insertions(+), 3 deletions(-) diff --git a/sim/h5_logger.py b/sim/h5_logger.py index a1812fe7..e455ae49 100644 --- a/sim/h5_logger.py +++ b/sim/h5_logger.py @@ -6,22 +6,31 @@ import h5py import matplotlib.pyplot as plt import numpy as np +from datetime import datetime class HDF5Logger: - def __init__(self, data_name: str, num_actions: int, max_timesteps: int, num_observations: int): + def __init__(self, data_name: str, num_actions: int, max_timesteps: int, num_observations: int, h5_out_dir: str = "sim/resources/"): self.data_name = data_name self.num_actions = num_actions self.max_timesteps = max_timesteps self.num_observations = num_observations self.max_threshold = 1e3 # Adjust this threshold as needed + self.h5_out_dir = h5_out_dir self.h5_file, self.h5_dict = self._create_h5_file() self.current_timestep = 0 def _create_h5_file(self): # Create a unique file ID idd = str(uuid.uuid4()) - h5_file = h5py.File(f"{self.data_name}/{idd}.h5", "w") + timestamp = datetime.now().strftime("%Y-%m-%d_%H-%M-%S") + + curr_h5_out_dir = f"{self.h5_out_dir}/{self.data_name}/h5_out/" + os.makedirs(curr_h5_out_dir, exist_ok=True) + + h5_file_path = f"{curr_h5_out_dir}/{timestamp}__{idd}.h5" + print(f"Saving HDF5 data to {h5_file_path}") + h5_file = h5py.File(h5_file_path, "w") # Create datasets for logging actions and observations dset_actions = h5_file.create_dataset("prev_actions", (self.max_timesteps, self.num_actions), dtype=np.float32) diff --git a/sim/sim2sim.py b/sim/sim2sim.py index 9945067e..9799964f 100755 --- a/sim/sim2sim.py +++ b/sim/sim2sim.py @@ -110,6 +110,7 @@ def run_mujoco( keyboard_use: bool = False, log_h5: bool = False, render: bool = True, + h5_out_dir: str = "sim/resources", ) -> None: """ Run the Mujoco simulation using the provided policy and configuration. @@ -178,7 +179,13 @@ def run_mujoco( if log_h5: stop_state_log = int(cfg.sim_duration / cfg.dt) / cfg.decimation - logger = HDF5Logger(embodiment, model_info["num_actions"], stop_state_log, model_info["num_observations"]) + logger = HDF5Logger( + data_name=embodiment, + num_actions=model_info["num_actions"], + max_timesteps=stop_state_log, + num_observations=model_info["num_observations"], + h5_out_dir=h5_out_dir + ) # Initialize variables for tracking upright steps and average speed upright_steps = 0 @@ -312,6 +319,7 @@ def parse_modelmeta( parser.add_argument("--load_model", type=str, required=True, help="Path to run to load from.") parser.add_argument("--keyboard_use", action="store_true", help="keyboard_use") parser.add_argument("--log_h5", action="store_true", help="log_h5") + parser.add_argument("--h5_out_dir", type=str, default="sim/resources", help="Directory to save HDF5 files") parser.add_argument("--no_render", action="store_false", dest="render", help="Disable rendering") parser.set_defaults(render=True) args = parser.parse_args() @@ -363,4 +371,5 @@ def parse_modelmeta( args.keyboard_use, args.log_h5, args.render, + args.h5_out_dir, ) From 833f03a73515f564f667267d831775d10798eb4c Mon Sep 17 00:00:00 2001 From: alik-git Date: Wed, 20 Nov 2024 22:26:37 +0000 Subject: [PATCH 2/6] save current actions to h5 --- sim/h5_logger.py | 6 ++++-- sim/sim2sim.py | 1 + 2 files changed, 5 insertions(+), 2 deletions(-) diff --git a/sim/h5_logger.py b/sim/h5_logger.py index e455ae49..81f123bb 100644 --- a/sim/h5_logger.py +++ b/sim/h5_logger.py @@ -33,7 +33,7 @@ def _create_h5_file(self): h5_file = h5py.File(h5_file_path, "w") # Create datasets for logging actions and observations - dset_actions = h5_file.create_dataset("prev_actions", (self.max_timesteps, self.num_actions), dtype=np.float32) + dset_prev_actions = h5_file.create_dataset("prev_actions", (self.max_timesteps, self.num_actions), dtype=np.float32) dset_2D_command = h5_file.create_dataset("observations/2D_command", (self.max_timesteps, 2), dtype=np.float32) dset_3D_command = h5_file.create_dataset("observations/3D_command", (self.max_timesteps, 3), dtype=np.float32) dset_q = h5_file.create_dataset("observations/q", (self.max_timesteps, self.num_actions), dtype=np.float32) @@ -42,10 +42,12 @@ def _create_h5_file(self): dset_euler = h5_file.create_dataset("observations/euler", (self.max_timesteps, 3), dtype=np.float32) dset_t = h5_file.create_dataset("observations/t", (self.max_timesteps, 1), dtype=np.float32) dset_buffer = h5_file.create_dataset("observations/buffer", (self.max_timesteps, self.num_observations), dtype=np.float32) + dset_curr_actions = h5_file.create_dataset("curr_actions", (self.max_timesteps, self.num_actions), dtype=np.float32) # Map datasets for easy access h5_dict = { - "prev_actions": dset_actions, + "prev_actions": dset_prev_actions, + "curr_actions": dset_curr_actions, "2D_command": dset_2D_command, "3D_command": dset_3D_command, "joint_pos": dset_q, diff --git a/sim/sim2sim.py b/sim/sim2sim.py index 9799964f..3474fbfa 100755 --- a/sim/sim2sim.py +++ b/sim/sim2sim.py @@ -252,6 +252,7 @@ def run_mujoco( "joint_pos": cur_pos_obs.astype(np.float32), "joint_vel": cur_vel_obs.astype(np.float32), "prev_actions": actions.astype(np.float32), + "curr_actions": target_q.astype(np.float32), "ang_vel": omega.astype(np.float32), "euler_rotation": eu_ang.astype(np.float32), "buffer": hist_obs.astype(np.float32) From 6a65d01905f9dc57341a81c5af7fd5e4f25a2aa0 Mon Sep 17 00:00:00 2001 From: alik-git Date: Wed, 20 Nov 2024 23:33:21 +0000 Subject: [PATCH 3/6] add h5out as arg to produce_sim_data as well --- sim/produce_sim_data.py | 3 +++ 1 file changed, 3 insertions(+) diff --git a/sim/produce_sim_data.py b/sim/produce_sim_data.py index 69f7e19e..a85f8f33 100644 --- a/sim/produce_sim_data.py +++ b/sim/produce_sim_data.py @@ -17,6 +17,8 @@ def run_simulation(sim_idx: int, args: argparse.Namespace) -> None: "--load_model", args.load_model, "--log_h5", + "--h5_out_dir", + args.h5_out_dir, "--no_render", ] @@ -48,6 +50,7 @@ def run_parallel_sims(num_threads: int, args: argparse.Namespace) -> None: parser.add_argument("--embodiment", default="stompypro", type=str, help="Embodiment name") parser.add_argument("--load_model", default="examples/walking_pro.onnx", type=str, help="Path to model to load") parser.add_argument("--num_examples", default=10000, type=int, help="Number of examples to run") + parser.add_argument("--h5_out_dir", default="sim/resources", type=str, help="Directory to save HDF5 files") args = parser.parse_args() # Run 100 examples total, in parallel batches From df09d0dbca67ef03385babc5a02c9c8aed64555f Mon Sep 17 00:00:00 2001 From: alik-git Date: Wed, 20 Nov 2024 23:39:57 +0000 Subject: [PATCH 4/6] compute actions before saving them --- sim/sim2sim.py | 5 +++-- 1 file changed, 3 insertions(+), 2 deletions(-) diff --git a/sim/sim2sim.py b/sim/sim2sim.py index 3474fbfa..04206a7e 100755 --- a/sim/sim2sim.py +++ b/sim/sim2sim.py @@ -237,6 +237,9 @@ def run_mujoco( input_data["imu_euler_xyz.1"] = eu_ang.astype(np.float32) input_data["buffer.1"] = hist_obs.astype(np.float32) + + positions, actions, hist_obs = policy.run(None, input_data) + target_q = positions if args.log_h5: logger.log_data({ @@ -258,8 +261,6 @@ def run_mujoco( "buffer": hist_obs.astype(np.float32) }) - positions, actions, hist_obs = policy.run(None, input_data) - target_q = positions # Generate PD control tau = pd_control(target_q, q, kps, dq, kds, default) # Calc torques From 102a7702f33de9c45b2be0676a9e82229572b0ab Mon Sep 17 00:00:00 2001 From: alik-git Date: Wed, 20 Nov 2024 23:41:32 +0000 Subject: [PATCH 5/6] typo fix: args.log_h5 -> log_h5 --- sim/sim2sim.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/sim/sim2sim.py b/sim/sim2sim.py index 04206a7e..cd20854f 100755 --- a/sim/sim2sim.py +++ b/sim/sim2sim.py @@ -241,7 +241,7 @@ def run_mujoco( positions, actions, hist_obs = policy.run(None, input_data) target_q = positions - if args.log_h5: + if log_h5: logger.log_data({ "t": np.array([count_lowlevel * cfg.dt], dtype=np.float32), "2D_command": np.array( @@ -286,7 +286,7 @@ def run_mujoco( print(f"Number of upright steps: {upright_steps}") print(f"Average speed: {average_speed:.4f} m/s") - if args.log_h5: + if log_h5: logger.close() From 0eb70d3f0eb9f990abdc65cef15ba2b5859d121e Mon Sep 17 00:00:00 2001 From: alik-git Date: Thu, 21 Nov 2024 00:29:14 +0000 Subject: [PATCH 6/6] fix: rename actions to prev_actions, and set prev_action to curr_action at the end of loop --- sim/sim2sim.py | 17 +++++++++-------- 1 file changed, 9 insertions(+), 8 deletions(-) diff --git a/sim/sim2sim.py b/sim/sim2sim.py index cd20854f..292462b5 100755 --- a/sim/sim2sim.py +++ b/sim/sim2sim.py @@ -159,7 +159,7 @@ def run_mujoco( viewer = mujoco_viewer.MujocoViewer(model, data) target_q = np.zeros((model_info["num_actions"]), dtype=np.double) - actions = np.zeros((model_info["num_actions"]), dtype=np.double) + prev_actions = np.zeros((model_info["num_actions"]), dtype=np.double) hist_obs = np.zeros((model_info["num_observations"]), dtype=np.double) count_lowlevel = 0 @@ -231,16 +231,16 @@ def run_mujoco( input_data["dof_pos.1"] = cur_pos_obs.astype(np.float32) input_data["dof_vel.1"] = cur_vel_obs.astype(np.float32) - input_data["prev_actions.1"] = actions.astype(np.float32) + input_data["prev_actions.1"] = prev_actions.astype(np.float32) input_data["imu_ang_vel.1"] = omega.astype(np.float32) input_data["imu_euler_xyz.1"] = eu_ang.astype(np.float32) input_data["buffer.1"] = hist_obs.astype(np.float32) - - positions, actions, hist_obs = policy.run(None, input_data) - target_q = positions + positions, curr_actions, hist_obs = policy.run(None, input_data) + target_q = positions + if log_h5: logger.log_data({ "t": np.array([count_lowlevel * cfg.dt], dtype=np.float32), @@ -254,13 +254,14 @@ def run_mujoco( "3D_command": np.array([x_vel_cmd, y_vel_cmd, yaw_vel_cmd], dtype=np.float32), "joint_pos": cur_pos_obs.astype(np.float32), "joint_vel": cur_vel_obs.astype(np.float32), - "prev_actions": actions.astype(np.float32), - "curr_actions": target_q.astype(np.float32), + "prev_actions": prev_actions.astype(np.float32), + "curr_actions": curr_actions.astype(np.float32), "ang_vel": omega.astype(np.float32), "euler_rotation": eu_ang.astype(np.float32), "buffer": hist_obs.astype(np.float32) }) - + + prev_actions = curr_actions # Generate PD control tau = pd_control(target_q, q, kps, dq, kds, default) # Calc torques