da6b040e254710f0df907d838db51f4f2cc9bf93,social_rl/multiagent_tfagents/multiagent_ppo.py,MultiagentPPO,get_single_agent_specs,#MultiagentPPO#Any#Any#,217
Before Change
for k in time_step_spec.observation.keys():
if k == "direction":
shape = [1]
elif k == "image":
// Remove agent dimension
shape = time_step_spec.observation[k].shape[1:]
else:
After Change
maximum=spec.maximum,
dtype=spec.dtype)
single_obs_spec = tf.nest.map_structure(make_single_agent_spec,
time_step_spec.observation)
single_reward_spec = tensor_spec.TensorSpec(
shape=(), dtype=time_step_spec.reward.dtype, name="reward")
single_time_step_spec = ts_lib.TimeStep(time_step_spec.step_type,
single_reward_spec,
In pattern: SUPERPATTERN
Frequency: 4
Non-data size: 4
Instances Project Name: google-research/google-research
Commit Name: da6b040e254710f0df907d838db51f4f2cc9bf93
Time: 2021-03-08
Author: ldennis@google.com
File Name: social_rl/multiagent_tfagents/multiagent_ppo.py
Class Name: MultiagentPPO
Method Name: get_single_agent_specs
Project Name: tensorflow/agents
Commit Name: 1bef8a0cb502401e33f8572897d981ef81a1a829
Time: 2020-04-30
Author: bartok@google.com
File Name: tf_agents/bandits/policies/neural_linucb_policy.py
Class Name: NeuralLinUCBPolicy
Method Name: _action
Project Name: tensorflow/agents
Commit Name: b92caeba0b2d531c2ac1e16f595a54222abe6845
Time: 2020-04-23
Author: bartok@google.com
File Name: tf_agents/bandits/policies/linear_bandit_policy.py
Class Name: LinearBanditPolicy
Method Name: _distribution
Project Name: tensorflow/agents
Commit Name: c62215debda5bf5d89723f4112f1e3e2f063cd52
Time: 2020-04-17
Author: kokiopou@google.com
File Name: tf_agents/trajectories/time_step.py
Class Name:
Method Name: termination