a949acef87c6f92589cbd68ff062ecac652539ed,mushroom_rl/solvers/lqr.py,,compute_lqr_Q,#Any#Any#Any#Any#,92
Before Change
sa = np.hstack((s, a))
M = _compute_lqr_Q_matrix(lqr, K)
m = lambda x, y: x.T @ M @ x
return -1. * pairwise_distances(sa, metric=m).diagonal().reshape((-1, 1))
def compute_lqr_Q_gaussian_policy(s, a, lqr, K, Sigma):
After Change
sa = np.hstack((s, a))
M = _compute_lqr_Q_matrix(lqr, K)
return -1. * np.einsum("...k,kl,...l->...", sa, M, sa).reshape(-1, 1)
def compute_lqr_Q_gaussian_policy(s, a, lqr, K, Sigma):
In pattern: SUPERPATTERN
Frequency: 3
Non-data size: 9
Instances
Project Name: AIRLab-POLIMI/mushroom
Commit Name: a949acef87c6f92589cbd68ff062ecac652539ed
Time: 2020-08-18
Author: joao.ac.carvalho@gmail.com
File Name: mushroom_rl/solvers/lqr.py
Class Name:
Method Name: compute_lqr_Q
Project Name: AIRLab-POLIMI/mushroom
Commit Name: a949acef87c6f92589cbd68ff062ecac652539ed
Time: 2020-08-18
Author: joao.ac.carvalho@gmail.com
File Name: mushroom_rl/solvers/lqr.py
Class Name:
Method Name: compute_lqr_V_gaussian_policy_gradient_K
Project Name: AIRLab-POLIMI/mushroom
Commit Name: a949acef87c6f92589cbd68ff062ecac652539ed
Time: 2020-08-18
Author: joao.ac.carvalho@gmail.com
File Name: mushroom_rl/solvers/lqr.py
Class Name:
Method Name: compute_lqr_V