fe8d55ae1870b6c7c3725f7ac7cc6b1d1ac0d39e,tensorforce/models/q_model.py,QModel,tf_q_delta,#QModel#Any#Any#Any#Any#,59
Before Change
next_q_value = tf.where(condition=terminal, x=zeros, y=(self.discount * next_q_value))
delta = reward + next_q_value - q_value  # tf.stop_gradient(q_target)
collapsed_size = util.prod(util.shape(delta)[1:])
return tf.reshape(tensor=delta, shape=(-1, collapsed_size))
def tf_loss_per_instance(self, states, internals, actions, terminal, reward):
embedding = self.network.apply(
After Change
:return: A list of deltas per action
for _ in range(util.rank(q_value) - 1):
terminal = tf.expand_dims(input=terminal, axis=1)
reward = tf.expand_dims(input=reward, axis=1)
multiples = (1,) + util.shape(q_value)[1:]
terminal = tf.tile(input=terminal, multiples=multiples)
reward = tf.tile(input=reward, multiples=multiples)
In pattern: SUPERPATTERN
Frequency: 3
Non-data size: 5
Instances
Project Name: reinforceio/tensorforce
Commit Name: fe8d55ae1870b6c7c3725f7ac7cc6b1d1ac0d39e
Time: 2017-10-26
Author: aok25@cl.cam.ac.uk
File Name: tensorforce/models/q_model.py
Class Name: QModel
Method Name: tf_q_delta
Project Name: rwth-i6/returnn-experiments
Commit Name: a21861f99e3dc4b778fd776b3e8e00dbaee988ca
Time: 2021-03-27
Author: albzey@gmail.com
File Name: common/models/encoder/blstm_cnn_specaug.py
Class Name:
Method Name: make_net
Project Name: scikit-image/scikit-image
Commit Name: 13df5b1a4687c48abf3cdc1894b100936d7e8f0a
Time: 2019-11-12
Author: r.fezzani@vitadx.com
File Name: skimage/measure/tests/test_marching_cubes.py
Class Name:
Method Name: test_both_algs_same_result_donut