bdd1a023482b34aa9980c64b434ce75824e16543,sac/policies/gmm.py,GMMPolicy,get_action,#GMMPolicy#Any#,75
Before Change
raise AttributeError
# Get the GMM means first.
feeds = {self._obs_pl: obs[None]}
mus = tf.get_default_session().run(self._dist.mus_t, feeds)[0]  # K x Da
qs = self._qf.eval(obs[None], mus)
if self._fixed_h is not None:
h = self._fixed_h
else:
h = np.argmax(qs)
return mus[h, :], {}  # Da
@contextmanager
def fix_h(self, h):
After Change
TODO: Modify `NNPolicy.get_action` and remove this
return self.get_actions(observation[None])[0], {}
@overrides
def get_actions(self, obs):
Sample actions based on the observations.
In pattern: SUPERPATTERN
Frequency: 5
Non-data size: 7
Instances Project Name: rail-berkeley/softlearning
Commit Name: bdd1a023482b34aa9980c64b434ce75824e16543
Time: 2018-05-22
Author: kristian.hartikainen@gmail.com
File Name: sac/policies/gmm.py
Class Name: GMMPolicy
Method Name: get_action
Project Name: arnomoonens/yarll
Commit Name: 2b77a13f3870712284122f2a5411c7d4b8db82e6
Time: 2019-06-09
Author: arno.moonens@gmail.com
File Name: yarll/agents/sac.py
Class Name: SAC
Method Name: softq_value
Project Name: arnomoonens/yarll
Commit Name: 2b77a13f3870712284122f2a5411c7d4b8db82e6
Time: 2019-06-09
Author: arno.moonens@gmail.com
File Name: yarll/agents/sac.py
Class Name: SAC
Method Name: actions
Project Name: arnomoonens/yarll
Commit Name: 2b77a13f3870712284122f2a5411c7d4b8db82e6
Time: 2019-06-09
Author: arno.moonens@gmail.com
File Name: yarll/agents/sac.py
Class Name: SAC
Method Name: value
Project Name: arnomoonens/yarll
Commit Name: 2b77a13f3870712284122f2a5411c7d4b8db82e6
Time: 2019-06-09
Author: arno.moonens@gmail.com
File Name: yarll/agents/sac.py
Class Name: SAC
Method Name: target_value