a7582d472ecd556e5f75e18fb3cf44fa5fce3897,ml/rl/training/sac_trainer.py,SACTrainer,train,#SACTrainer#Any#Any#,107
Before Change
if evaluator is not None:
cpe_stats = BatchStatsForCPE(
td_loss=q1_loss.detach().cpu().numpy(),
logged_rewards=reward.detach().cpu().numpy() ,
model_values_on_logged_actions=q1_value.detach().cpu().numpy(),
model_propensities=actor_output.log_prob.exp().detach().cpu().numpy(),
model_values=min_q_actor_value.detach().cpu().numpy(),
After Change
)
SummaryWriterContext.add_histogram("actor/loss", actor_loss)
self.loss_reporter.report(td_loss=float(q1_loss), reward_loss=None)
if evaluator is not None:
cpe_stats = BatchStatsForCPE(
logged_rewards=reward.detach(),
In pattern: SUPERPATTERN
Frequency: 4
Non-data size: 5
Instances
Project Name: facebookresearch/Horizon
Commit Name: a7582d472ecd556e5f75e18fb3cf44fa5fce3897
Time: 2018-11-16
Author: jjg@fb.com
File Name: ml/rl/training/sac_trainer.py
Class Name: SACTrainer
Method Name: train
Project Name: facebookresearch/Horizon
Commit Name: a7582d472ecd556e5f75e18fb3cf44fa5fce3897
Time: 2018-11-16
Author: jjg@fb.com
File Name: ml/rl/training/dqn_trainer.py
Class Name: DQNTrainer
Method Name: train
Project Name: facebookresearch/Horizon
Commit Name: a7582d472ecd556e5f75e18fb3cf44fa5fce3897
Time: 2018-11-16
Author: jjg@fb.com
File Name: ml/rl/training/ddpg_trainer.py
Class Name: DDPGTrainer
Method Name: train
Project Name: facebookresearch/Horizon
Commit Name: a7582d472ecd556e5f75e18fb3cf44fa5fce3897
Time: 2018-11-16
Author: jjg@fb.com
File Name: ml/rl/training/parametric_dqn_trainer.py
Class Name: ParametricDQNTrainer
Method Name: train