a55f9be217b2320cec7c7dc44a8245496f851af5,softlearning/algorithms/sac.py,SAC,_init_placeholders,#SAC#,120

Before Change


        )

        if self._store_extra_policy_info:
            self._log_pis_ph = tf.placeholder(
                tf.float32,
                shape=(None, 1),
                name="log_pis",
            )
            self._raw_actions_ph = tf.placeholder(
                tf.float32,
                shape=(None, *self._action_shape),
                name="raw_actions",
            )

    def _get_Q_target(self):
        next_actions = self._policy.actions([self._next_observations_ph])
        next_log_pis = self._policy.log_pis(

After Change


            - reward
            - terminals
        
        self._placeholders = {
            "iteration": tf.placeholder(
                tf.int64, shape=None, name="iteration",
            ),
            "observations": tf.placeholder(
                tf.float32,
                shape=(None, *self._observation_shape),
                name="observation",
            ),
            "next_observations": tf.placeholder(
                tf.float32,
                shape=(None, *self._observation_shape),
                name="next_observation",
            ),
            "actions": tf.placeholder(
                tf.float32,
                shape=(None, *self._action_shape),
                name="actions",
            ),
            "rewards": tf.placeholder(
                tf.float32,
                shape=(None, 1),
                name="rewards",
            ),
            "terminals": tf.placeholder(
                tf.bool,
                shape=(None, 1),
                name="terminals",
            ),
        }

    def _get_Q_target(self):
        next_observations = self._placeholders["next_observations"]
        next_actions = self._policy.actions([next_observations])

In pattern: SUPERPATTERN

Frequency: 4

Non-data size: 5

Instances

Link

Project Name: rail-berkeley/softlearning

Commit Name: a55f9be217b2320cec7c7dc44a8245496f851af5

Time: 2019-06-01

Author: hartikainen@berkeley.edu

File Name: softlearning/algorithms/sac.py

Class Name: SAC

Method Name: _init_placeholders

Link

Project Name: reinforceio/tensorforce

Commit Name: f52db36a739dfd7385c7bb5c60593debbbc3a8b1

Time: 2017-04-08

Author: mi.schaarschmidt@gmail.com

File Name: tensorforce/models/naf_model.py

Class Name: NAFModel

Method Name: __init__

Link

Project Name: reinforceio/tensorforce

Commit Name: a504ed5cfb74a4a8531ef85deb315d6a4ed0b4cf

Time: 2017-04-09

Author: mi.schaarschmidt@gmail.com

File Name: tensorforce/models/distributed_pg_model.py

Class Name: DistributedPGModel

Method Name: __init__

Link

Project Name: rail-berkeley/softlearning

Commit Name: a55f9be217b2320cec7c7dc44a8245496f851af5

Time: 2019-06-01

Author: hartikainen@berkeley.edu

File Name: softlearning/algorithms/sql.py

Class Name: SQL

Method Name: _init_placeholders