Skip to content
Snippets Groups Projects
Commit 69ad3981 authored by Brussart Paul-emile
Browse files

Added loss visualization

parent ec80fa30
No related branches found
No related tags found
No related merge requests found
reinforce_cartpole.png

2.34 KiB

...@@ -28,9 +28,11 @@ optimizer = optim.Adam(model.parameters(), lr=5e-3) ...@@ -28,9 +28,11 @@ optimizer = optim.Adam(model.parameters(), lr=5e-3)
# Keep track of the number of rewards for each episodes # Keep track of the number of rewards for each episodes
rewardsByEpisode = [] rewardsByEpisode = []
lossesByEpisode = []
# training loop # training loop
for episode in range(500): for episode in range(500):
print("Episode's number {0} / {1}".format(episode, 500))
# reset the environment # reset the environment
state = env.reset() state = env.reset()
log_probs = [] log_probs = []
...@@ -69,18 +71,31 @@ for episode in range(500): ...@@ -69,18 +71,31 @@ for episode in range(500):
model_loss.append(-log_prob * return_) model_loss.append(-log_prob * return_)
model_loss = torch.cat(model_loss).sum() model_loss = torch.cat(model_loss).sum()
lossesByEpisode.append(model_loss.item())
# update the model # update the model
optimizer.zero_grad() optimizer.zero_grad()
model_loss.backward() model_loss.backward()
optimizer.step() optimizer.step()
print("N° de l'épisode :", episode)
print("Nombre de rewards :", len(rewards))
# X axis : # X axis :
x = list(range(len(rewardsByEpisode))) x = list(range(len(rewardsByEpisode)))
# Plot Rewards by Episodes
plt.figure("Figure 1")
plt.xlabel('Episodes N°') plt.xlabel('Episodes N°')
plt.ylabel('Number of rewards given') plt.ylabel('Number of rewards given')
plt.plot(x, rewardsByEpisode, '--') plt.plot(x, rewardsByEpisode)
plt.savefig('reinforce_cartpole_reward.png')
plt.show()
# Plot losses by Episodes
plt.figure("Figure 2")
plt.xlabel("Episodes N°")
plt.ylabel("Loss")
plt.plot(x, lossesByEpisode)
plt.title("Loss by episodes")
plt.savefig("reinforce_cartpole_loss.png")
plt.show() plt.show()
plt.savefig('reinforce_cartpole.png')
reinforce_cartpole_loss.png

50.1 KiB

reinforce_cartpole_reward.png

49.4 KiB

0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Please register or sign in to comment