```python
class QLearningAgent(agent.BaseAgent):
    """Agent that maintains a table of action-value estimates."""

    def agent_init(self, agent_init_info):
        """Configure the agent from a settings mapping.

        Args:
            agent_init_info: Mapping that must provide the keys
                "num_actions", "num_states", "epsilon", "step_size",
                "discount" and "seed".

        Raises:
            KeyError: If ``agent_init_info`` is a dict and any of the
                keys listed above is missing.
        """
        # Store the settings given by the caller.
        self.num_actions = agent_init_info["num_actions"]
        self.num_states = agent_init_info["num_states"]
        # NOTE(review): epsilon is presumably the exploration rate, step_size
        # the learning rate and discount the return discount factor -- confirm
        # against the methods that consume them.
        self.epsilon = agent_init_info["epsilon"]
        self.step_size = agent_init_info["step_size"]
        self.discount = agent_init_info["discount"]

        # The seed lives in the same mapping as every other setting; reading
        # it from any other name would fail because no such variable exists
        # in this scope.
        self.rand_generator = np.random.RandomState(agent_init_info["seed"])

        # The array of action-value estimates, one row per state and one
        # column per action, initialised to zero.
        self.q = np.zeros((self.num_states, self.num_actions))
```

[Read More]