diff --git a/examples/ppo_hover_train.py b/examples/ppo_hover_train.py index 30d7368..a08494b 100644 --- a/examples/ppo_hover_train.py +++ b/examples/ppo_hover_train.py @@ -77,6 +77,6 @@ while True: # Run indefinitely.. model.learn(total_timesteps=num_timesteps, reset_num_timesteps=False, tb_log_name="PPO-Quad_"+start_time.strftime('%H-%M-%S')) # Save the model - model.save(f"{models_dir}/PPO_hover_policy_{num_timesteps*(epoch_count+1)}") + model.save(f"{models_dir}/PPO/{start_time.strftime('%H-%M-%S')}/hover_{num_timesteps*(epoch_count+1)}") epoch_count += 1 \ No newline at end of file