5c81c1c3138d296b8ac5f836e118cfb849b7bf5d,softqlearning/algos/softqlearning.py,SoftQLearning,_evaluate,#SoftQLearning#Any#,464
Before Change
("Epoch", epoch),
("Alpha", self._alpha),
("DiscountedReturnAvg", average_discounted_return),
("TotalReturnAvg", np.mean(total_returns)),
("TotalReturnMin", np.min(total_returns)),
("TotalReturnMax", np.max(total_returns)),
("TotalReturnStd", np.std(total_returns))
])
for key, value in statistics.items():
After Change
]
episode_lengths = [
len(p["rewards"]) for p in paths
]
statistics = OrderedDict([
In pattern: SUPERPATTERN
Frequency: 3
Non-data size: 5
Instances
Project Name: rail-berkeley/softlearning
Commit Name: 5c81c1c3138d296b8ac5f836e118cfb849b7bf5d
Time: 2018-05-22
Author: haarnoja@berkeley.edu
File Name: softqlearning/algos/softqlearning.py
Class Name: SoftQLearning
Method Name: _evaluate
Project Name: rlworkgroup/garage
Commit Name: 5e11b5f80351db52dfdda4311c505a47ed9abcb5
Time: 2020-01-10
Author: zequnyu@usc.edu
File Name: src/garage/tf/algos/batch_polopt.py
Class Name: BatchPolopt
Method Name: process_samples
Project Name: ScottfreeLLC/AlphaPy
Commit Name: 1c34f59317bf1944391babe902aeab480324a630
Time: 2016-10-09
Author: Mark.R.Conway@gmail.com
File Name: optimize.py
Class Name:
Method Name: hyper_grid_search