a55f9be217b2320cec7c7dc44a8245496f851af5,softlearning/algorithms/sac.py,SAC,_init_placeholders,#SAC#,120

Before Change


        )

        if self._store_extra_policy_info:
            self._log_pis_ph = tf.placeholder(
                tf.float32,
                shape=(None, 1),
                name="log_pis",
            )
            self._raw_actions_ph = tf.placeholder(
                tf.float32,
                shape=(None, *self._action_shape),
                name="raw_actions",
            )

    def _get_Q_target(self):
        next_actions = self._policy.actions([self._next_observations_ph])
        next_log_pis = self._policy.log_pis(

After Change


            - reward
            - terminals
        
        self._placeholders = {
            "iteration": tf.placeholder(
                tf.int64, shape=None, name="iteration",
            ),
            "observations": tf.placeholder(
                tf.float32,
                shape=(None, *self._observation_shape),
                name="observation",
            ),
            "next_observations": tf.placeholder(
                tf.float32,
                shape=(None, *self._observation_shape),
                name="next_observation",
            ),
            "actions": tf.placeholder(
                tf.float32,
                shape=(None, *self._action_shape),
                name="actions",
            ),
            "rewards": tf.placeholder(
                tf.float32,
                shape=(None, 1),
                name="rewards",
            ),
            "terminals": tf.placeholder(
                tf.bool,
                shape=(None, 1),
                name="terminals",
            ),
        }

    def _get_Q_target(self):
        next_observations = self._placeholders["next_observations"]
        next_actions = self._policy.actions([next_observations])
Italian Trulli
In pattern: SUPERPATTERN

Frequency: 4

Non-data size: 5

Instances


Project Name: rail-berkeley/softlearning
Commit Name: a55f9be217b2320cec7c7dc44a8245496f851af5
Time: 2019-06-01
Author: hartikainen@berkeley.edu
File Name: softlearning/algorithms/sac.py
Class Name: SAC
Method Name: _init_placeholders


Project Name: reinforceio/tensorforce
Commit Name: f52db36a739dfd7385c7bb5c60593debbbc3a8b1
Time: 2017-04-08
Author: mi.schaarschmidt@gmail.com
File Name: tensorforce/models/naf_model.py
Class Name: NAFModel
Method Name: __init__


Project Name: reinforceio/tensorforce
Commit Name: a504ed5cfb74a4a8531ef85deb315d6a4ed0b4cf
Time: 2017-04-09
Author: mi.schaarschmidt@gmail.com
File Name: tensorforce/models/distributed_pg_model.py
Class Name: DistributedPGModel
Method Name: __init__


Project Name: rail-berkeley/softlearning
Commit Name: a55f9be217b2320cec7c7dc44a8245496f851af5
Time: 2019-06-01
Author: hartikainen@berkeley.edu
File Name: softlearning/algorithms/sql.py
Class Name: SQL
Method Name: _init_placeholders