# test_gym.py (600 B)

  1. import gym
  2. import time
  3. # 生成环境
  4. env = gym.make('CartPole-v1', render_mode='human')
  5. # 环境初始化
  6. state = env.reset(seed=1)
  7. # 循环交互
  8. while True:
  9. # 渲染画面
  10. # env.render()
  11. # 从动作空间随机获取一个动作
  12. action = env.action_space.sample()
  13. # agent与环境进行一步交互
  14. state, reward, terminated, truncated, info = env.step(action)
  15. print('state = {0}; reward = {1}'.format(state, reward))
  16. # 判断当前episode 是否完成
  17. if terminated:
  18. print('terminated')
  19. break
  20. time.sleep(0.1)
  21. # 环境结束
  22. # env.close()