SwatGarg committed on
Commit
535ba6d
1 Parent(s): de2ee39

Update q_learning_chatbot.py

Browse files
Files changed (1) hide show
  1. q_learning_chatbot.py +1 -1
q_learning_chatbot.py CHANGED
@@ -49,7 +49,7 @@ class QLearningChatbot:
49
  next_state_index = self.states.index(next_state)
50
 
51
  current_q_value = self.q_values[current_state_index]
52
- max_next_q_value = np.max(self.q_values[next_state_index, :])
53
 
54
  new_q_value = current_q_value + self.learning_rate * (reward + self.discount_factor * max_next_q_value - current_q_value)
55
  self.q_values[current_state_index] = new_q_value
 
49
  next_state_index = self.states.index(next_state)
50
 
51
  current_q_value = self.q_values[current_state_index]
52
+ max_next_q_value = np.max(self.q_values[next_state_index])
53
 
54
  new_q_value = current_q_value + self.learning_rate * (reward + self.discount_factor * max_next_q_value - current_q_value)
55
  self.q_values[current_state_index] = new_q_value