"""Train, save, and visually evaluate an A2C agent on CartPole-v1.

Running this file as a script:

1. builds a single-environment ``DummyVecEnv`` around ``CartPole-v1``,
2. trains an ``A2C`` agent with the ``MlpPolicy`` for ``TRAIN_TIMESTEPS`` steps,
3. saves the model under ``MODEL_PATH`` (the accompanying artifact is
   ``a2c_sb3_cartpole.zip``), and
4. rolls the trained policy out for ``EVAL_STEPS`` steps while rendering.
"""
import gym
from stable_baselines3 import A2C
from stable_baselines3.common.vec_env import DummyVecEnv

ENV_ID = "CartPole-v1"
MODEL_PATH = "a2c_sb3_cartpole"
TRAIN_TIMESTEPS = 1000
EVAL_STEPS = 1000


def make_env():
    """Return a fresh CartPole environment.

    A named factory is used instead of ``lambda: env`` so the callable never
    depends on a module-level name that is later rebound to the vectorized
    wrapper itself.
    """
    return gym.make(ENV_ID)


def main():
    """Train the agent, persist it, and render an evaluation rollout."""
    # DummyVecEnv expects a list of zero-argument environment factories.
    env = DummyVecEnv([make_env])
    try:
        model = A2C("MlpPolicy", env, verbose=1)
        model.learn(total_timesteps=TRAIN_TIMESTEPS)
        model.save(MODEL_PATH)

        # Evaluation rollout. No manual reset on episode end is performed
        # here; per the SB3 VecEnv documentation, vectorized environments
        # reset finished sub-environments automatically.
        obs = env.reset()
        for _ in range(EVAL_STEPS):
            # Use the greedy action for evaluation rather than sampling.
            action, _ = model.predict(obs, deterministic=True)
            obs, _rewards, _dones, _infos = env.step(action)
            env.render()
    finally:
        # Always release the environment (and any render window), even if
        # training or the rollout raises.
        env.close()


if __name__ == "__main__":
    main()