5c81c1c3138d296b8ac5f836e118cfb849b7bf5d,softqlearning/algos/softqlearning.py,SoftQLearning,_evaluate,#SoftQLearning#Any#,464

Before Change


            ("Epoch", epoch),
            ("Alpha", self._alpha),
            ("DiscountedReturnAvg", average_discounted_return),
            ("TotalReturnAvg", np.mean(total_returns)),
            ("TotalReturnMin", np.min(total_returns)),
            ("TotalReturnMax", np.max(total_returns)),
            ("TotalReturnStd", np.std(total_returns))
        ])

        for key, value in statistics.items():

After Change


        ]

        episode_lengths = [
            len(p["rewards"]) for p in paths
        ]

        statistics = OrderedDict([
In pattern: SUPERPATTERN

Frequency: 3

Non-data size: 5

Instances


Project Name: rail-berkeley/softlearning
Commit Name: 5c81c1c3138d296b8ac5f836e118cfb849b7bf5d
Time: 2018-05-22
Author: haarnoja@berkeley.edu
File Name: softqlearning/algos/softqlearning.py
Class Name: SoftQLearning
Method Name: _evaluate


Project Name: rlworkgroup/garage
Commit Name: 5e11b5f80351db52dfdda4311c505a47ed9abcb5
Time: 2020-01-10
Author: zequnyu@usc.edu
File Name: src/garage/tf/algos/batch_polopt.py
Class Name: BatchPolopt
Method Name: process_samples


Project Name: ScottfreeLLC/AlphaPy
Commit Name: 1c34f59317bf1944391babe902aeab480324a630
Time: 2016-10-09
Author: Mark.R.Conway@gmail.com
File Name: optimize.py
Class Name:
Method Name: hyper_grid_search