# Build a zero-filled 2-D table: one row per observation index and one column
# per action index, with both sizes read from the environment's spaces.
# NOTE(review): presumably the value table for tabular Q-learning, and both
# spaces are assumed to be discrete (they must expose an integer `.n`) --
# confirm against where `env` is created.
Q = np.zeros((env.observation_space.n, env.action_space.n))

# Show the freshly initialised (all-zero) table.
print(Q)