2from droneRobot
import DroneRobot
5from stable_baselines3
import TD3
6from stable_baselines3.common.noise
import OrnsteinUhlenbeckActionNoise
9model_path = os.path.join(
'Training',
'Saved Models', f
'td3_drone_model{datetime.datetime.now().strftime("%Y_%m_%d_%H_%M_%S")}')
11log_path = os.path.join(
'Training',
'Logs',
'td3_drone_logs')
15env.target_location = [0, 0, 2]
19n_actions = env.action_space.shape[-1]
22action_noise = OrnsteinUhlenbeckActionNoise(mean=np.zeros(n_actions), sigma=float(0.1) * np.ones(n_actions))
26env.startTensorBoard(log_path)
30timesteps = env.steps_per_episode * episodes
33model = TD3(
"MlpPolicy", env, action_noise=action_noise, verbose=1, device=
'cuda', tensorboard_log=log_path)
41model.learn(total_timesteps=timesteps, log_interval=10)
45model.save(
"td3_drone_model", path=model_path)