fa2cd0c7f0d382d2bb3726e9cec392962b9e35a0,mushroom/algorithms/batch_td.py,DeepFQI,draw_action,#DeepFQI#Any#,139
Before Change
else:
extended_state = self._buffer.get()
action = super(DeepFQI, self).draw_action(extended_state)
self._episode_steps += 1
After Change
else:
extended_state = self._buffer.get()
if not np.random.uniform() < self.policy._epsilon(extended_state):
q = np.ones(self.mdp_info["action_space"].n)
for i in xrange(q.size):
features = self._extractor.models[i].predict(
np.expand_dims(extended_state, axis=0))
q[i] = self.approximator.predict(features)
return np.array(
[np.random.choice(np.argwhere(q == np.max(q)).ravel())])
return self.mdp_info["action_space"].sample()
self._episode_steps += 1
return action
In pattern: SUPERPATTERN
Frequency: 3
Non-data size: 4
Instances
Project Name: AIRLab-POLIMI/mushroom
Commit Name: fa2cd0c7f0d382d2bb3726e9cec392962b9e35a0
Time: 2017-09-11
Author: carlo.deramo@gmail.com
File Name: mushroom/algorithms/batch_td.py
Class Name: DeepFQI
Method Name: draw_action
Project Name: kengz/SLM-Lab
Commit Name: 5a126fc7cac272dfe2514554ef228001c795d729
Time: 2019-08-03
Author: kengzwl@gmail.com
File Name: slm_lab/agent/algorithm/sac.py
Class Name: SoftActorCritic
Method Name: act
Project Name: havakv/pycox
Commit Name: 6671f9d02fc5e90d3d64dfa7bf4f9f9abd0826f1
Time: 2019-02-19
Author: haavard.kvamme@gmail..com
File Name: pycox/models/cox_cc.py
Class Name: CoxTime
Method Name: compute_baseline_hazards