"""Package namespace that re-exports helpers from the sibling submodules.

Every name below is imported from a submodule of this package so that callers
can import it directly from the package instead of from the individual
submodule. The order of the import statements follows the order in which the
submodules were originally loaded.
"""
from .exploration import get_epsilon_greedy_fn, create_noise_generator
from .ppo import (
    ppo_data, ppo_loss, ppo_info, ppo_policy_data, ppo_policy_error, ppo_value_data, ppo_value_error,
    ppo_error, ppo_error_continuous, ppo_policy_error_continuous, ppo_data_continuous, ppo_policy_data_continuous,
)
from .happo import (
    happo_data, happo_policy_data, happo_value_data, happo_loss, happo_policy_loss, happo_info,
    happo_error, happo_policy_error, happo_value_error, happo_error_continuous, happo_policy_error_continuous,
)
from .ppg import ppg_data, ppg_joint_loss, ppg_joint_error
from .gae import gae_data, gae
from .a2c import a2c_data, a2c_error, a2c_error_continuous
from .coma import coma_data, coma_error
from .td import (
    q_nstep_td_data, q_nstep_td_error, q_1step_td_data,
    q_1step_td_error, m_q_1step_td_data, m_q_1step_td_error, td_lambda_data, td_lambda_error,
    q_nstep_td_error_with_rescale, v_1step_td_data, v_1step_td_error, v_nstep_td_data, v_nstep_td_error,
    generalized_lambda_returns, dist_1step_td_data, dist_1step_td_error, dist_nstep_td_error, dist_nstep_td_data,
    nstep_return_data, nstep_return, iqn_nstep_td_data, iqn_nstep_td_error, qrdqn_nstep_td_data, qrdqn_nstep_td_error,
    fqf_nstep_td_data, fqf_nstep_td_error, fqf_calculate_fraction_loss, evaluate_quantile_at_action,
    q_nstep_sql_td_error, dqfd_nstep_td_error, dqfd_nstep_td_data, q_v_1step_td_error, q_v_1step_td_data,
    dqfd_nstep_td_error_with_rescale, discount_cumsum, bdq_nstep_td_error,
)
# All names from ``.vtrace`` are imported in one statement; it stays at the
# position of the first original ``.vtrace`` import so that the submodule
# load order is unchanged.
from .vtrace import (
    vtrace_loss, compute_importance_weights,
    vtrace_data, vtrace_error_discrete_action, vtrace_error_continuous_action,
)
from .upgo import upgo_loss
from .adder import get_gae, get_gae_with_default_last_value, get_nstep_return_data, get_train_sample
from .value_rescale import value_transform, value_inv_transform, symlog, inv_symlog
from .beta_function import beta_function_map
from .retrace import compute_q_retraces
from .acer import acer_policy_error, acer_value_error, acer_trust_region_update
# NOTE: ``HybridDeterminsticSampler`` is spelled exactly as it is imported
# from ``.sampler``; do not "correct" it here without renaming it there too.
from .sampler import (
    ArgmaxSampler, MultinomialSampler, MuSampler, ReparameterizationSampler, HybridStochasticSampler,
    HybridDeterminsticSampler,
)
|