45496de13b7932d8ec860da06f14d113000803be,ml/rl/test/gridworld/test_gridworld_pytorch.py,TestGridworld,test_reward_boost,#TestGridworld#,114

Before Change


        )
        self.assertGreater(evaluator.mc_loss[-1], 0.12)

        for _ in range(2):
            for tdp in tdps:
                tdp.rewards = tdp.rewards.flatten()
                tdp.not_terminals = tdp.not_terminals.flatten()
                trainer.train(tdp, None)

        predictor = trainer.predictor()
        evaluator.evaluate(predictor)
        print(
            "Post-Training eval: ",

After Change



        tdps = environment.preprocess_samples(samples, self.minibatch_size)

        with tempfile.TemporaryDirectory() as tmpdirname:
            tmp_path = os.path.join(tmpdirname, "model")
            predictor.save(tmp_path, "minidb")
            new_predictor = DQNPredictor.load(tmp_path, "minidb", False)
            evaluator.evaluate(new_predictor)
        print(
            "Pre-Training eval: ",
            evaluator.mc_loss[-1],
            evaluator.value_doubly_robust[-1],
In pattern: SUPERPATTERN

Frequency: 3

Non-data size: 6

Instances


Project Name: facebookresearch/Horizon
Commit Name: 45496de13b7932d8ec860da06f14d113000803be
Time: 2018-08-29
Author: jjg@fb.com
File Name: ml/rl/test/gridworld/test_gridworld_pytorch.py
Class Name: TestGridworld
Method Name: test_reward_boost


Project Name: reinforceio/tensorforce
Commit Name: cd50ec1c075fed30b19771879b818ba14ecfb816
Time: 2020-07-05
Author: alexkuhnle@t-online.de
File Name: test/test_features.py
Class Name: TestFeatures
Method Name: test_pretrain


Project Name: reinforceio/tensorforce
Commit Name: cd50ec1c075fed30b19771879b818ba14ecfb816
Time: 2020-07-05
Author: alexkuhnle@t-online.de
File Name: test/test_saving.py
Class Name: TestSaving
Method Name: test_modules