This commit is contained in:
9
tp5.py
9
tp5.py
@@ -104,15 +104,6 @@ def train_and_save(weights_path="cartpole_actor_critic.pth", episodes=500):
|
|||||||
|
|
||||||
print(f'Episode {ep + 1}: total reward {total_r:.1f}')
|
print(f'Episode {ep + 1}: total reward {total_r:.1f}')
|
||||||
|
|
||||||
fig, axes = plt.subplots(1, 2)
|
|
||||||
axes[0].plot(range(len(log_probs)), log_probs)
|
|
||||||
axes[0].set_title('log probability')
|
|
||||||
|
|
||||||
axes[1].plot(range(len(td_errors)), td_errors)
|
|
||||||
axes[1].set_title('TD errors')
|
|
||||||
|
|
||||||
plt.show()
|
|
||||||
|
|
||||||
# Libération des ressources liées à l'environnement
|
# Libération des ressources liées à l'environnement
|
||||||
env.close()
|
env.close()
|
||||||
|
|
||||||
|
|||||||
Reference in New Issue
Block a user