a24b65545e5802b3a7b9e134ca603ee03cef1d1d,ml/rl/test/gridworld/test_gridworld_continuous.py,TestGridworldContinuous,test_evaluator_ground_truth,#TestGridworldContinuous#,141
Before Change
possible_next_actions, reward_timelines
)
trainer.stream_tdp(tdp, evaluator)
self.assertLess(evaluator.td_loss[-1], 0.05)
self.assertLess(evaluator.mc_loss[-1], 0.12)
After Change
self.minibatch_size,
)
for tdp in tdps:
trainer.stream_tdp(tdp, evaluator)
self.assertLess(evaluator.td_loss[-1], 0.05)
self.assertLess(evaluator.mc_loss[-1], 0.12)
def test_evaluator_timeline(self):
In pattern: SUPERPATTERN
Frequency: 5
Non-data size: 4
Instances
Project Name: facebookresearch/Horizon
Commit Name: a24b65545e5802b3a7b9e134ca603ee03cef1d1d
Time: 2018-02-20
Author: jjg@fb.com
File Name: ml/rl/test/gridworld/test_gridworld_continuous.py
Class Name: TestGridworldContinuous
Method Name: test_evaluator_ground_truth
Project Name: facebookresearch/Horizon
Commit Name: a24b65545e5802b3a7b9e134ca603ee03cef1d1d
Time: 2018-02-20
Author: jjg@fb.com
File Name: ml/rl/test/gridworld/test_gridworld.py
Class Name: TestGridworld
Method Name: test_evaluator_timeline
Project Name: facebookresearch/Horizon
Commit Name: a24b65545e5802b3a7b9e134ca603ee03cef1d1d
Time: 2018-02-20
Author: jjg@fb.com
File Name: ml/rl/test/gridworld/test_gridworld.py
Class Name: TestGridworld
Method Name: test_evaluator_ground_truth
Project Name: facebookresearch/Horizon
Commit Name: a24b65545e5802b3a7b9e134ca603ee03cef1d1d
Time: 2018-02-20
Author: jjg@fb.com
File Name: ml/rl/test/gridworld/test_limited_action_gridworld.py
Class Name: TestLimitedActionGridworld
Method Name: test_pure_q_learning_all_cheat
Project Name: facebookresearch/Horizon
Commit Name: a24b65545e5802b3a7b9e134ca603ee03cef1d1d
Time: 2018-02-20
Author: jjg@fb.com
File Name: ml/rl/test/gridworld/test_gridworld_continuous.py
Class Name: TestGridworldContinuous
Method Name: test_evaluator_timeline