1 2
| import gym import random
|
1 2 3 4 5 6 7
# Name of the Gym environment to create. The original cell assigned
# 'CartPole-v1' first and then immediately overwrote it, so only the
# FrozenLake value ever took effect; change the name here to try another one.
env_name = 'FrozenLake8x8-v1'
env = gym.make(env_name)

# Show the spaces so the reader can see what states and actions look like.
print("Observation space:", env.observation_space)
print('Action space:', env.action_space)
|
Observation space: Discrete(64)
Action space: Discrete(4)
1 2 3 4 5 6 7 8
class Agent:
    """Baseline agent that picks actions uniformly at random."""

    def __init__(self, env):
        """Read the number of available actions from ``env``.

        Args:
            env: Object exposing ``action_space.n`` (the number of actions).
        """
        self.action_size = env.action_space.n
        print(self.action_size)

    def get_action(self, state):
        """Return a random action index in ``[0, action_size)``.

        Args:
            state: Current observation; accepted for interface
                compatibility but not used by this random policy.
        """
        return random.randrange(self.action_size)
|
1 2 3 4 5 6 7 8
# Drive the environment with the random agent for a fixed number of steps,
# rendering after every step.
state = env.reset()
agent = Agent(env)
for _ in range(200):
    action = agent.get_action(state)
    state, reward, done, info = env.step(action)
    env.render()
    if done:
        # The episode has ended; stepping it further is undefined in Gym,
        # so begin a fresh episode before the next action.
        state = env.reset()
|
4
若你觉得我的文章对你有帮助，欢迎点击上方按钮对我打赏。