418c54a59b807a9afef43da86c1a810fe9b48856,test/test_optimizers.py,TestOptimizers,test_synchronization,#TestOptimizers#,52
Before Change
def test_synchronization(self):
    """Run the unit test with the policy optimizer set to "synchronization".

    Policy and baseline both use an "auto" network of size 8 and depth 1 and
    differ only in their ``rnn`` value (2 vs. 1). The baseline is configured
    with the "adam" optimizer and the "policy_gradient" objective.
    """
    self.start_tests(name="synchronization")

    # Identical network shape for both; only the rnn setting differs.
    policy_spec = dict(network=dict(type="auto", size=8, depth=1, rnn=2))
    baseline_spec = dict(network=dict(type="auto", size=8, depth=1, rnn=1))

    self.unittest(
        policy=policy_spec,
        optimizer="synchronization",
        baseline=baseline_spec,
        baseline_optimizer="adam",
        baseline_objective="policy_gradient",
    )
def test_tf_optimizer(self):
self.start_tests(name="tf-optimizer")
After Change
def test_synchronization(self):
    """Run the unit test with the baseline optimizer set to "synchronization".

    Declares one bool, one int and two bounded float actions, plus a baseline
    made of an "auto" network (size 8, depth 1, rnn 1) and a gaussian
    distribution with ``global_stddev=True`` for ``gaussian_action2``.
    """
    self.start_tests(name="synchronization")

    actions = dict(
        bool_action=dict(type="bool", shape=(1,)),
        int_action=dict(type="int", shape=(2,), num_values=4),
        gaussian_action1=dict(type="float", shape=(1, 2), min_value=1.0, max_value=2.0),
        gaussian_action2=dict(type="float", shape=(), min_value=-2.0, max_value=1.0),
    )
    baseline = dict(
        network=dict(type="auto", size=8, depth=1, rnn=1),
        distributions=dict(
            gaussian_action2=dict(type="gaussian", global_stddev=True),
        ),
    )

    self.unittest(
        # Requires same size, but can still vary RNN horizon
        actions=actions, baseline=baseline, baseline_optimizer="synchronization",
        # Using policy_gradient here, since action_value is covered by DQN
        baseline_objective="policy_gradient"
    )
def test_tf_optimizer(self):
self.start_tests(name="tf-optimizer")
In pattern: SUPERPATTERN
Frequency: 3
Non-data size: 8
Instances
Project Name: reinforceio/tensorforce
Commit Name: 418c54a59b807a9afef43da86c1a810fe9b48856
Time: 2020-08-17
Author: alexkuhnle@t-online.de
File Name: test/test_optimizers.py
Class Name: TestOptimizers
Method Name: test_synchronization
Project Name: reinforceio/tensorforce
Commit Name: 32e5293feacd55cd694ddea3baebb02a5bebbaed
Time: 2020-08-22
Author: alexkuhnle@t-online.de
File Name: test/test_agents.py
Class Name: TestAgents
Method Name: test_dpg
Project Name: reinforceio/tensorforce
Commit Name: 32e5293feacd55cd694ddea3baebb02a5bebbaed
Time: 2020-08-22
Author: alexkuhnle@t-online.de
File Name: test/test_objectives.py
Class Name: TestObjectives
Method Name: test_deterministic_policy_gradient