5a126fc7cac272dfe2514554ef228001c795d729,slm_lab/agent/algorithm/sac.py,SoftActorCritic,act,#SoftActorCritic#Any#,85

Before Change


            return policy_util.random(state, self, self.body).cpu().squeeze().numpy()
        else:
            action = super().act(state)
            return np.tanh(action)  // continuous action bound

    def calc_q(self, state, action, net=None):
        """Forward-pass to calculate the predicted state-action-value from q1_net."""

After Change


            return policy_util.random(state, self, self.body).cpu().squeeze().numpy()
        else:
            action = self.action_policy(state, self, self.body)
            if self.body.is_discrete:
                // discrete output is RelaxedOneHotCategorical, need to sample to int. clamp to prevent minor precision issue with prob < 0
                action = torch.distributions.Categorical(probs=action.clamp(min=0)).sample()
            else:
                action = torch.tanh(action)  // continuous action bound
            return action.cpu().squeeze().numpy()

    def calc_q(self, state, action, net=None):
        """Forward-pass to calculate the predicted state-action-value from q1_net."""

In pattern: SUPERPATTERN

Frequency: 3

Non-data size: 3

Instances

Link

Project Name: kengz/SLM-Lab

Commit Name: 5a126fc7cac272dfe2514554ef228001c795d729

Time: 2019-08-03

Author: kengzwl@gmail.com

File Name: slm_lab/agent/algorithm/sac.py

Class Name: SoftActorCritic

Method Name: act

Link

Project Name: scikit-optimize/scikit-optimize

Commit Name: 7bd676c9ab6b23ec93499fd72aeadee3a334a163

Time: 2017-08-18

Author: betatim@gmail.com

File Name: skopt/utils.py

Class Name:

Method Name: normalize_dimensions

Link

Project Name: dmnfarrell/pandastable

Commit Name: 9bf47c410efde68615d18265078e9cd317007103

Time: 2017-08-04

Author: farrell.damien@gmail.com

File Name: pandastable/plugins/mdanalysis.py

Class Name:

Method Name: feature_selection