45496de13b7932d8ec860da06f14d113000803be,ml/rl/test/gridworld/test_gridworld_pytorch.py,TestGridworld,test_reward_boost,#TestGridworld#,114
Before Change
)
self.assertGreater(evaluator.mc_loss[-1], 0.12)
for _ in range(2):
for tdp in tdps:
tdp.rewards = tdp.rewards.flatten()
tdp.not_terminals = tdp.not_terminals.flatten()
trainer.train(tdp, None)
predictor = trainer.predictor()
evaluator.evaluate(predictor)
print(
"Post-Training eval: ",
After Change
tdps = environment.preprocess_samples(samples, self.minibatch_size)
with tempfile.TemporaryDirectory() as tmpdirname:
tmp_path = os.path.join(tmpdirname, "model")
predictor.save(tmp_path, "minidb")
new_predictor = DQNPredictor.load(tmp_path, "minidb", False)
evaluator.evaluate(new_predictor)
print(
"Pre-Training eval: ",
evaluator.mc_loss[-1],
evaluator.value_doubly_robust[-1],
In pattern: SUPERPATTERN
Frequency: 3
Non-data size: 6
Instances
Project Name: facebookresearch/Horizon
Commit Name: 45496de13b7932d8ec860da06f14d113000803be
Time: 2018-08-29
Author: jjg@fb.com
File Name: ml/rl/test/gridworld/test_gridworld_pytorch.py
Class Name: TestGridworld
Method Name: test_reward_boost
Project Name: reinforceio/tensorforce
Commit Name: cd50ec1c075fed30b19771879b818ba14ecfb816
Time: 2020-07-05
Author: alexkuhnle@t-online.de
File Name: test/test_features.py
Class Name: TestFeatures
Method Name: test_pretrain
Project Name: reinforceio/tensorforce
Commit Name: cd50ec1c075fed30b19771879b818ba14ecfb816
Time: 2020-07-05
Author: alexkuhnle@t-online.de
File Name: test/test_saving.py
Class Name: TestSaving
Method Name: test_modules