This commit is contained in:
9
tp5.py
9
tp5.py
@@ -104,15 +104,6 @@ def train_and_save(weights_path="cartpole_actor_critic.pth", episodes=500):
|
||||
|
||||
print(f'Episode {ep + 1}: total reward {total_r:.1f}')
|
||||
|
||||
fig, axes = plt.subplots(1, 2)
|
||||
axes[0].plot(range(len(log_probs)), log_probs)
|
||||
axes[0].set_title('log probability')
|
||||
|
||||
axes[1].plot(range(len(td_errors)), td_errors)
|
||||
axes[1].set_title('TD errors')
|
||||
|
||||
plt.show()
|
||||
|
||||
# Libération des ressources liées à l'environnement
|
||||
env.close()
|
||||
|
||||
|
||||
Reference in New Issue
Block a user