Skip to content
Snippets Groups Projects
Commit 6f5dc483 authored by Ghelfi Manon
Browse files

Upload New File

parent dd38e6d5
No related branches found
No related tags found
No related merge requests found
import gym
from stable_baselines3 import A2C
# Train an A2C agent with an MLP policy on CartPole-v1, save it, then roll
# the trained policy out for a fixed number of steps while rendering.
env = gym.make("CartPole-v1")

model = A2C("MlpPolicy", env, verbose=1)
model.learn(total_timesteps=10000)
model.save("a2c_sb3_cartpole")

# Run the rollout on the environment attached to the model rather than on
# `env` directly, so observations and actions have the shape the model uses.
vec_env = model.get_env()
obs = vec_env.reset()
for i in range(1000):
    # deterministic=True asks the policy for its deterministic action.
    action, _state = model.predict(obs, deterministic=True)
    # NOTE(review): `done` is never checked here; this relies on the
    # vectorized env resetting itself at episode end — confirm against the
    # installed Stable-Baselines3 version.
    obs, reward, done, info = vec_env.step(action)
    vec_env.render()
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Please register or sign in to comment