f353943f836ad162ae45a96a404d5db48dba7690,ml/rl/training/parametric_dqn_trainer.py,ParametricDQNTrainer,internal_prediction,#ParametricDQNTrainer#Any#Any#,137
Before Change
self.q_network.eval()
q_values = self.q_network(
rlt.StateAction(
state=rlt.FeatureVector(float_features=state),
action=rlt.FeatureVector(float_features=action),
)
)
self.q_network.train()
return q_values.q_value.cpu()
After Change
self.q_network.eval()
q_values = self.q_network(
rlt.PreprocessedStateAction(state=state, action=action)
)
self.q_network.train()
return q_values.q_value.cpu()
In pattern: SUPERPATTERN
Frequency: 3
Non-data size: 4
Instances
Project Name: facebookresearch/Horizon
Commit Name: f353943f836ad162ae45a96a404d5db48dba7690
Time: 2019-07-15
Author: jjg@fb.com
File Name: ml/rl/training/parametric_dqn_trainer.py
Class Name: ParametricDQNTrainer
Method Name: internal_prediction
Project Name: facebookresearch/Horizon
Commit Name: f353943f836ad162ae45a96a404d5db48dba7690
Time: 2019-07-15
Author: jjg@fb.com
File Name: ml/rl/training/parametric_dqn_trainer.py
Class Name: ParametricDQNTrainer
Method Name: internal_reward_estimation
Project Name: facebookresearch/Horizon
Commit Name: f353943f836ad162ae45a96a404d5db48dba7690
Time: 2019-07-15
Author: jjg@fb.com
File Name: ml/rl/training/td3_trainer.py
Class Name: TD3Trainer
Method Name: train