给个体的一个观测(状态)生成一个不重复的字符串作为Q、E字典里的键 ''' return str(state) def _get_(self, QorE _assert_state_in_QE(s, randomized=True) return QorE[s][a] def _set_(self, QorE, s, a, value _assert_state_in_QE(s, randomized=True) QorE[s][a] = value def _resetEValue(self):
(状态)生成一个不重复的字符串作为Q、E字典里的键 ''' return str(state) def _get_(self, QorE _assert_state_in_QE(s, randomized=True) return QorE[s][a] def _set_(self, QorE, s, a, value _assert_state_in_QE(s, randomized=True) QorE[s][a] = value def _resetEValue(self):