SYMBOL INDEX (405 symbols across 31 files) FILE: algorithms/actor_critic.py class Actor (line 11) | class Actor(nn.Module): method __init__ (line 19) | def __init__(self, args, obs_space, action_space, device=torch.device(... method forward (line 42) | def forward(self, obs, rnn_states, masks, available_actions=None, dete... method evaluate_actions (line 71) | def evaluate_actions(self, obs, rnn_states, action, masks, available_a... class Critic (line 118) | class Critic(nn.Module): method __init__ (line 125) | def __init__(self, args, cent_obs_space, device=torch.device("cpu")): method forward (line 149) | def forward(self, cent_obs, rnn_states, masks): FILE: algorithms/happo_policy.py class HAPPO_Policy (line 6) | class HAPPO_Policy: method __init__ (line 17) | def __init__(self, args, obs_space, cent_obs_space, act_space, device=... method lr_decay (line 46) | def lr_decay(self, episode, episodes): method get_actions (line 55) | def get_actions(self, cent_obs, obs, rnn_states_actor, rnn_states_crit... method get_values (line 83) | def get_values(self, cent_obs, rnn_states_critic, masks): method evaluate_actions (line 95) | def evaluate_actions(self, cent_obs, obs, rnn_states_actor, rnn_states... method act (line 125) | def act(self, obs, rnn_states_actor, masks, available_actions=None, de... FILE: algorithms/happo_trainer.py class HAPPO (line 8) | class HAPPO(): method __init__ (line 15) | def __init__(self, method cal_value_loss (line 48) | def cal_value_loss(self, values, value_preds_batch, return_batch, acti... method ppo_update (line 88) | def ppo_update(self, sample, update_actor=True): method train (line 169) | def train(self, buffer, update_actor=True): method prep_training (line 222) | def prep_training(self): method prep_rollout (line 226) | def prep_rollout(self): FILE: algorithms/hatrpo_policy.py class HATRPO_Policy (line 6) | class HATRPO_Policy: method __init__ (line 17) | def __init__(self, args, obs_space, cent_obs_space, act_space, device=... method lr_decay (line 46) | def lr_decay(self, episode, episodes): method get_actions (line 55) | def get_actions(self, cent_obs, obs, rnn_states_actor, rnn_states_crit... method get_values (line 83) | def get_values(self, cent_obs, rnn_states_critic, masks): method evaluate_actions (line 95) | def evaluate_actions(self, cent_obs, obs, rnn_states_actor, rnn_states... method act (line 125) | def act(self, obs, rnn_states_actor, masks, available_actions=None, de... FILE: algorithms/hatrpo_trainer.py class HATRPO (line 9) | class HATRPO(): method __init__ (line 16) | def __init__(self, method cal_value_loss (line 51) | def cal_value_loss(self, values, value_preds_batch, return_batch, acti... method flat_grad (line 91) | def flat_grad(self, grads): method flat_hessian (line 100) | def flat_hessian(self, hessians): method flat_params (line 109) | def flat_params(self, model): method update_model (line 116) | def update_model(self, model, new_params): method kl_approx (line 125) | def kl_approx(self, q, p): method kl_divergence (line 130) | def kl_divergence(self, obs, rnn_states, action, masks, available_acti... method conjugate_gradient (line 152) | def conjugate_gradient(self, actor, obs, rnn_states, action, masks, av... method fisher_vector_product (line 170) | def fisher_vector_product(self, actor, obs, rnn_states, action, masks,... method trpo_update (line 181) | def trpo_update(self, sample, update_actor=True): method train (line 321) | def train(self, buffer, update_actor=True): method prep_training (line 378) | def prep_training(self): method prep_rollout (line 382) | def prep_rollout(self): FILE: algorithms/utils/act.py class ACTLayer (line 5) | class ACTLayer(nn.Module): method __init__ (line 13) | def __init__(self, action_space, inputs_dim, use_orthogonal, gain, arg... method forward (line 41) | def forward(self, x, available_actions=None, deterministic=False): method get_probs (line 85) | def get_probs(self, x, available_actions=None): method evaluate_actions (line 107) | def evaluate_actions(self, x, action, available_actions=None, active_m... method evaluate_actions_trpo (line 167) | def evaluate_actions_trpo(self, x, action, available_actions=None, act... FILE: algorithms/utils/cnn.py class Flatten (line 6) | class Flatten(nn.Module): method forward (line 7) | def forward(self, x): class CNNLayer (line 11) | class CNNLayer(nn.Module): method __init__ (line 12) | def __init__(self, obs_shape, hidden_size, use_orthogonal, use_ReLU, k... method forward (line 40) | def forward(self, x): class CNNBase (line 46) | class CNNBase(nn.Module): method __init__ (line 47) | def __init__(self, args, obs_shape): method forward (line 56) | def forward(self, x): FILE: algorithms/utils/distributions.py class FixedCategorical (line 14) | class FixedCategorical(torch.distributions.Categorical): method sample (line 15) | def sample(self): method log_probs (line 18) | def log_probs(self, actions): method mode (line 27) | def mode(self): class FixedNormal (line 32) | class FixedNormal(torch.distributions.Normal): method log_probs (line 33) | def log_probs(self, actions): method entrop (line 37) | def entrop(self): method mode (line 40) | def mode(self): class FixedBernoulli (line 45) | class FixedBernoulli(torch.distributions.Bernoulli): method log_probs (line 46) | def log_probs(self, actions): method entropy (line 49) | def entropy(self): method mode (line 52) | def mode(self): class Categorical (line 56) | class Categorical(nn.Module): method __init__ (line 57) | def __init__(self, num_inputs, num_outputs, use_orthogonal=True, gain=... method forward (line 65) | def forward(self, x, available_actions=None): class DiagGaussian (line 94) | class DiagGaussian(nn.Module): method __init__ (line 95) | def __init__(self, num_inputs, num_outputs, use_orthogonal=True, gain=... method forward (line 113) | def forward(self, x, available_actions=None): class Bernoulli (line 118) | class Bernoulli(nn.Module): method __init__ (line 119) | def __init__(self, num_inputs, num_outputs, use_orthogonal=True, gain=... method forward (line 127) | def forward(self, x): class AddBias (line 131) | class AddBias(nn.Module): method __init__ (line 132) | def __init__(self, bias): method forward (line 136) | def forward(self, x): FILE: algorithms/utils/mlp.py class MLPLayer (line 6) | class MLPLayer(nn.Module): method __init__ (line 7) | def __init__(self, input_dim, hidden_size, layer_N, use_orthogonal, us... method forward (line 26) | def forward(self, x): class MLPBase (line 33) | class MLPBase(nn.Module): method __init__ (line 34) | def __init__(self, args, obs_shape, cat_self=True, attn_internal=False): method forward (line 52) | def forward(self, x): FILE: algorithms/utils/rnn.py class RNNLayer (line 7) | class RNNLayer(nn.Module): method __init__ (line 8) | def __init__(self, inputs_dim, outputs_dim, recurrent_N, use_orthogonal): method forward (line 24) | def forward(self, x, hxs, masks): FILE: algorithms/utils/util.py function init (line 7) | def init(module, weight_init, bias_init, gain=1): function get_clones (line 12) | def get_clones(module, N): function check (line 15) | def check(input): FILE: configs/config.py function get_config (line 3) | def get_config(): FILE: envs/env_wrappers.py class CloudpickleWrapper (line 10) | class CloudpickleWrapper(object): method __init__ (line 15) | def __init__(self, x): method __getstate__ (line 18) | def __getstate__(self): method __setstate__ (line 22) | def __setstate__(self, ob): class ShareVecEnv (line 27) | class ShareVecEnv(ABC): method __init__ (line 41) | def __init__(self, num_envs, observation_space, share_observation_spac... method reset (line 48) | def reset(self): method step_async (line 60) | def step_async(self, actions): method step_wait (line 72) | def step_wait(self): method close_extras (line 85) | def close_extras(self): method close (line 92) | def close(self): method step (line 100) | def step(self, actions): method render (line 109) | def render(self, mode='human'): method get_images (line 120) | def get_images(self): method unwrapped (line 127) | def unwrapped(self): method get_viewer (line 133) | def get_viewer(self): function worker (line 140) | def worker(remote, parent_remote, env_fn_wrapper): class GuardSubprocVecEnv (line 177) | class GuardSubprocVecEnv(ShareVecEnv): method __init__ (line 178) | def __init__(self, env_fns, spaces=None): method step_async (line 199) | def step_async(self, actions): method step_wait (line 205) | def step_wait(self): method reset (line 211) | def reset(self): method reset_task (line 217) | def reset_task(self): method close (line 222) | def close(self): class SubprocVecEnv (line 235) | class SubprocVecEnv(ShareVecEnv): method __init__ (line 236) | def __init__(self, env_fns, spaces=None): method step_async (line 257) | def step_async(self, actions): method step_wait (line 262) | def step_wait(self): method reset (line 268) | def reset(self): method reset_task (line 275) | def reset_task(self): method close (line 280) | def close(self): method render (line 292) | def render(self, mode="rgb_array"): function shareworker (line 300) | def shareworker(remote, parent_remote, env_fn_wrapper): class ShareSubprocVecEnv (line 343) | class ShareSubprocVecEnv(ShareVecEnv): method __init__ (line 344) | def __init__(self, env_fns, spaces=None): method step_async (line 367) | def step_async(self, actions): method step_wait (line 372) | def step_wait(self): method reset (line 378) | def reset(self): method reset_task (line 385) | def reset_task(self): method close (line 390) | def close(self): function choosesimpleworker (line 403) | def choosesimpleworker(remote, parent_remote, env_fn_wrapper): class ChooseSimpleSubprocVecEnv (line 434) | class ChooseSimpleSubprocVecEnv(ShareVecEnv): method __init__ (line 435) | def __init__(self, env_fns, spaces=None): method step_async (line 455) | def step_async(self, actions): method step_wait (line 460) | def step_wait(self): method reset (line 466) | def reset(self, reset_choose): method render (line 472) | def render(self, mode="rgb_array"): method reset_task (line 479) | def reset_task(self): method close (line 484) | def close(self): function chooseworker (line 497) | def chooseworker(remote, parent_remote, env_fn_wrapper): class ChooseSubprocVecEnv (line 524) | class ChooseSubprocVecEnv(ShareVecEnv): method __init__ (line 525) | def __init__(self, env_fns, spaces=None): method step_async (line 546) | def step_async(self, actions): method step_wait (line 551) | def step_wait(self): method reset (line 557) | def reset(self, reset_choose): method reset_task (line 564) | def reset_task(self): method close (line 569) | def close(self): function chooseguardworker (line 582) | def chooseguardworker(remote, parent_remote, env_fn_wrapper): class ChooseGuardSubprocVecEnv (line 607) | class ChooseGuardSubprocVecEnv(ShareVecEnv): method __init__ (line 608) | def __init__(self, env_fns, spaces=None): method step_async (line 629) | def step_async(self, actions): method step_wait (line 634) | def step_wait(self): method reset (line 640) | def reset(self, reset_choose): method reset_task (line 646) | def reset_task(self): method close (line 651) | def close(self): class DummyVecEnv (line 665) | class DummyVecEnv(ShareVecEnv): method __init__ (line 666) | def __init__(self, env_fns): method step_async (line 673) | def step_async(self, actions): method step_wait (line 676) | def step_wait(self): method reset (line 691) | def reset(self): method close (line 695) | def close(self): method render (line 699) | def render(self, mode="human"): class ShareDummyVecEnv (line 710) | class ShareDummyVecEnv(ShareVecEnv): method __init__ (line 711) | def __init__(self, env_fns): method step_async (line 718) | def step_async(self, actions): method step_wait (line 721) | def step_wait(self): method reset (line 737) | def reset(self): method close (line 742) | def close(self): method render (line 746) | def render(self, mode="human"): class ChooseDummyVecEnv (line 756) | class ChooseDummyVecEnv(ShareVecEnv): method __init__ (line 757) | def __init__(self, env_fns): method step_async (line 764) | def step_async(self, actions): method step_wait (line 767) | def step_wait(self): method reset (line 774) | def reset(self, reset_choose): method close (line 780) | def close(self): method render (line 784) | def render(self, mode="human"): class ChooseSimpleDummyVecEnv (line 793) | class ChooseSimpleDummyVecEnv(ShareVecEnv): method __init__ (line 794) | def __init__(self, env_fns): method step_async (line 801) | def step_async(self, actions): method step_wait (line 804) | def step_wait(self): method reset (line 810) | def reset(self, reset_choose): method close (line 815) | def close(self): method render (line 819) | def render(self, mode="human"): FILE: envs/ma_mujoco/multiagent_mujoco/coupled_half_cheetah.py class CoupledHalfCheetah (line 7) | class CoupledHalfCheetah(mujoco_env.MujocoEnv, utils.EzPickle): method __init__ (line 8) | def __init__(self, **kwargs): method step (line 12) | def step(self, action): method _get_obs (line 28) | def _get_obs(self): method reset_model (line 34) | def reset_model(self): method viewer_setup (line 40) | def viewer_setup(self): method get_env_info (line 43) | def get_env_info(self): FILE: envs/ma_mujoco/multiagent_mujoco/manyagent_ant.py class ManyAgentAntEnv (line 7) | class ManyAgentAntEnv(mujoco_env.MujocoEnv, utils.EzPickle): method __init__ (line 8) | def __init__(self, **kwargs): method _generate_asset (line 28) | def _generate_asset(self, n_segs, asset_path): method step (line 81) | def step(self, a): method _get_obs (line 102) | def _get_obs(self): method reset_model (line 109) | def reset_model(self): method viewer_setup (line 115) | def viewer_setup(self): FILE: envs/ma_mujoco/multiagent_mujoco/manyagent_swimmer.py class ManyAgentSwimmerEnv (line 7) | class ManyAgentSwimmerEnv(mujoco_env.MujocoEnv, utils.EzPickle): method __init__ (line 8) | def __init__(self, **kwargs): method _generate_asset (line 28) | def _generate_asset(self, n_segs, asset_path): method step (line 64) | def step(self, a): method _get_obs (line 75) | def _get_obs(self): method reset_model (line 80) | def reset_model(self): FILE: envs/ma_mujoco/multiagent_mujoco/mujoco_multi.py function env_fn (line 12) | def env_fn(env, **kwargs) -> MultiAgentEnv: # TODO: this may be a more c... class NormalizedActions (line 21) | class NormalizedActions(gym.ActionWrapper): method _action (line 23) | def _action(self, action): method action (line 29) | def action(self, action_): method _reverse_action (line 32) | def _reverse_action(self, action): class MujocoMulti (line 39) | class MujocoMulti(MultiAgentEnv): method __init__ (line 41) | def __init__(self, batch_size=None, **kwargs): method step (line 120) | def step(self, actions): method get_obs (line 147) | def get_obs(self): method get_obs_agent (line 162) | def get_obs_agent(self, agent_id): method get_obs_size (line 178) | def get_obs_size(self): method get_state (line 186) | def get_state(self, team=None): method get_state_size (line 199) | def get_state_size(self): method get_avail_actions (line 203) | def get_avail_actions(self): # all actions are always available method get_avail_agent_actions (line 206) | def get_avail_agent_actions(self, agent_id): method get_total_actions (line 210) | def get_total_actions(self): method get_stats (line 215) | def get_stats(self): method get_agg_stats (line 219) | def get_agg_stats(self, stats): method reset (line 222) | def reset(self, **kwargs): method render (line 228) | def render(self, **kwargs): method close (line 231) | def close(self): method seed (line 234) | def seed(self, args): method get_env_info (line 237) | def get_env_info(self): FILE: envs/ma_mujoco/multiagent_mujoco/multiagentenv.py function convert (line 5) | def convert(dictionary): class MultiAgentEnv (line 8) | class MultiAgentEnv(object): method __init__ (line 10) | def __init__(self, batch_size=None, **kwargs): method step (line 21) | def step(self, actions): method get_obs (line 25) | def get_obs(self): method get_obs_agent (line 29) | def get_obs_agent(self, agent_id): method get_obs_size (line 33) | def get_obs_size(self): method get_state (line 37) | def get_state(self): method get_state_size (line 40) | def get_state_size(self): method get_avail_actions (line 44) | def get_avail_actions(self): method get_avail_agent_actions (line 47) | def get_avail_agent_actions(self, agent_id): method get_total_actions (line 51) | def get_total_actions(self): method get_stats (line 56) | def get_stats(self): method get_agg_stats (line 60) | def get_agg_stats(self, stats): method reset (line 63) | def reset(self): method render (line 67) | def render(self): method close (line 70) | def close(self): method seed (line 73) | def seed(self, seed): method get_env_info (line 76) | def get_env_info(self): FILE: envs/ma_mujoco/multiagent_mujoco/obsk.py class Node (line 5) | class Node(): method __init__ (line 6) | def __init__(self, label, qpos_ids, qvel_ids, act_ids, body_fn=None, b... method __str__ (line 17) | def __str__(self): method __repr__ (line 20) | def __repr__(self): class HyperEdge (line 24) | class HyperEdge(): method __init__ (line 25) | def __init__(self, *edges): method __contains__ (line 28) | def __contains__(self, item): method __str__ (line 31) | def __str__(self): method __repr__ (line 34) | def __repr__(self): function get_joints_at_kdist (line 38) | def get_joints_at_kdist(agent_id, agent_partitions, hyperedges, k=0, kag... function build_obs (line 74) | def build_obs(env, k_dict, k_categories, global_dict, global_categories,... function build_actions (line 141) | def build_actions(agent_partitions, k_dict): function get_parts_and_edges (line 146) | def get_parts_and_edges(label, partitioning): FILE: envs/starcraft2/StarCraft2_Env.py class Direction (line 56) | class Direction(enum.IntEnum): class StarCraft2Env (line 63) | class StarCraft2Env(MultiAgentEnv): method __init__ (line 68) | def __init__( method _launch (line 330) | def _launch(self): method reset (line 381) | def reset(self): method _restart (line 438) | def _restart(self): method full_restart (line 449) | def full_restart(self): method step (line 455) | def step(self, actions): method get_agent_action (line 617) | def get_agent_action(self, a_id, action): method get_agent_action_heuristic (line 712) | def get_agent_action_heuristic(self, a_id, action): method reward_battle (line 809) | def reward_battle(self): method get_total_actions (line 866) | def get_total_actions(self): method distance (line 871) | def distance(x1, y1, x2, y2): method unit_shoot_range (line 875) | def unit_shoot_range(self, agent_id): method unit_sight_range (line 879) | def unit_sight_range(self, agent_id): method unit_max_cooldown (line 883) | def unit_max_cooldown(self, unit): method save_replay (line 898) | def save_replay(self): method unit_max_shield (line 906) | def unit_max_shield(self, unit): method can_move (line 915) | def can_move(self, unit, direction): method get_surrounding_points (line 933) | def get_surrounding_points(self, unit, include_self=False): method check_bounds (line 956) | def check_bounds(self, x, y): method get_surrounding_pathing (line 960) | def get_surrounding_pathing(self, unit): method get_surrounding_height (line 969) | def get_surrounding_height(self, unit): method get_obs_agent (line 978) | def get_obs_agent(self, agent_id): method get_obs (line 1144) | def get_obs(self): method get_state (line 1152) | def get_state(self, agent_id=-1): method get_state_agent (line 1327) | def get_state_agent(self, agent_id): method get_obs_enemy_feats_size (line 1522) | def get_obs_enemy_feats_size(self): method get_state_enemy_feats_size (line 1533) | def get_state_enemy_feats_size(self): method get_obs_ally_feats_size (line 1547) | def get_obs_ally_feats_size(self): method get_state_ally_feats_size (line 1561) | def get_state_ally_feats_size(self): method get_obs_own_feats_size (line 1578) | def get_obs_own_feats_size(self): method get_state_own_feats_size (line 1590) | def get_state_own_feats_size(self): method get_obs_move_feats_size (line 1605) | def get_obs_move_feats_size(self): method get_state_move_feats_size (line 1615) | def get_state_move_feats_size(self): method get_obs_size (line 1625) | def get_obs_size(self): method get_state_size (line 1651) | def get_state_size(self): method get_visibility_matrix (line 1737) | def get_visibility_matrix(self): method get_unit_type_id (line 1778) | def get_unit_type_id(self, unit, ally): method get_avail_agent_actions (line 1809) | def get_avail_agent_actions(self, agent_id): method get_avail_actions (line 1855) | def get_avail_actions(self): method close (line 1863) | def close(self): method seed (line 1868) | def seed(self, seed): method render (line 1872) | def render(self): method _kill_all_units (line 1876) | def _kill_all_units(self): method init_units (line 1886) | def init_units(self): method update_units (line 1941) | def update_units(self): method _init_ally_unit_types (line 1987) | def _init_ally_unit_types(self, min_unit_type): method only_medivac_left (line 2017) | def only_medivac_left(self, ally): method get_unit_by_id (line 2041) | def get_unit_by_id(self, a_id): method get_stats (line 2045) | def get_stats(self): FILE: envs/starcraft2/multiagentenv.py class MultiAgentEnv (line 6) | class MultiAgentEnv(object): method step (line 8) | def step(self, actions): method get_obs (line 12) | def get_obs(self): method get_obs_agent (line 16) | def get_obs_agent(self, agent_id): method get_obs_size (line 20) | def get_obs_size(self): method get_state (line 24) | def get_state(self): method get_state_size (line 28) | def get_state_size(self): method get_avail_actions (line 32) | def get_avail_actions(self): method get_avail_agent_actions (line 36) | def get_avail_agent_actions(self, agent_id): method get_total_actions (line 40) | def get_total_actions(self): method reset (line 44) | def reset(self): method render (line 48) | def render(self): method close (line 51) | def close(self): method seed (line 54) | def seed(self): method save_replay (line 57) | def save_replay(self): method get_env_info (line 61) | def get_env_info(self): FILE: envs/starcraft2/smac_maps.py class SMACMap (line 8) | class SMACMap(lib.Map): function get_smac_map_registry (line 448) | def get_smac_map_registry(): function get_map_params (line 456) | def get_map_params(map_name): FILE: runners/separated/base_runner.py function _t2n (line 11) | def _t2n(x): class Runner (line 14) | class Runner(object): method __init__ (line 15) | def __init__(self, config): method run (line 105) | def run(self): method warmup (line 108) | def warmup(self): method collect (line 111) | def collect(self, step): method insert (line 114) | def insert(self, data): method compute (line 118) | def compute(self): method train (line 127) | def train(self): method save (line 177) | def save(self): method restore (line 188) | def restore(self): method log_train (line 199) | def log_train(self, train_infos, total_num_steps): method log_env (line 205) | def log_env(self, env_infos, total_num_steps): FILE: runners/separated/mujoco_runner.py function _t2n (line 8) | def _t2n(x): class MujocoRunner (line 12) | class MujocoRunner(Runner): method __init__ (line 15) | def __init__(self, config): method run (line 18) | def run(self): method warmup (line 89) | def warmup(self): method collect (line 101) | def collect(self, step): method insert (line 129) | def insert(self, data): method log_train (line 157) | def log_train(self, train_infos, total_num_steps): method eval (line 166) | def eval(self, total_num_steps): FILE: runners/separated/smac_runner.py function _t2n (line 7) | def _t2n(x): class SMACRunner (line 10) | class SMACRunner(Runner): method __init__ (line 12) | def __init__(self, config): method run (line 15) | def run(self): method warmup (line 95) | def warmup(self): method collect (line 107) | def collect(self, step): method insert (line 136) | def insert(self, data): method log_train (line 162) | def log_train(self, train_infos, total_num_steps): method eval (line 170) | def eval(self, total_num_steps): FILE: scripts/train/train_mujoco.py function make_train_env (line 17) | def make_train_env(all_args): function make_eval_env (line 40) | def make_eval_env(all_args): function parse_args (line 63) | def parse_args(args, parser): function main (line 86) | def main(args): FILE: scripts/train/train_smac.py function make_train_env (line 17) | def make_train_env(all_args): function make_eval_env (line 36) | def make_eval_env(all_args): function parse_args (line 55) | def parse_args(args, parser): function main (line 73) | def main(args): FILE: utils/multi_discrete.py class MultiDiscrete (line 6) | class MultiDiscrete(gym.Space): method __init__ (line 22) | def __init__(self, array_of_param_array): method sample (line 28) | def sample(self): method contains (line 34) | def contains(self, x): method shape (line 38) | def shape(self): method __repr__ (line 41) | def __repr__(self): method __eq__ (line 44) | def __eq__(self, other): FILE: utils/popart.py class PopArt (line 8) | class PopArt(nn.Module): method __init__ (line 11) | def __init__(self, input_shape, norm_axes=1, beta=0.99999, per_element... method reset_parameters (line 25) | def reset_parameters(self): method running_mean_var (line 30) | def running_mean_var(self): method forward (line 36) | def forward(self, input_vector, train=True): method denormalize (line 64) | def denormalize(self, input_vector): FILE: utils/separated_buffer.py function _flatten (line 6) | def _flatten(T, N, x): function _cast (line 9) | def _cast(x): class SeparatedReplayBuffer (line 12) | class SeparatedReplayBuffer(object): method __init__ (line 13) | def __init__(self, args, obs_space, share_obs_space, act_space): method update_factor (line 64) | def update_factor(self, factor): method insert (line 67) | def insert(self, share_obs, obs, rnn_states, rnn_states_critic, action... method chooseinsert (line 87) | def chooseinsert(self, share_obs, obs, rnn_states, rnn_states_critic, ... method after_update (line 107) | def after_update(self): method chooseafter_update (line 118) | def chooseafter_update(self): method compute_returns (line 124) | def compute_returns(self, next_value, value_normalizer=None): method feed_forward_generator (line 171) | def feed_forward_generator(self, advantages, num_mini_batch=None, mini... method naive_recurrent_generator (line 231) | def naive_recurrent_generator(self, advantages, num_mini_batch): method recurrent_generator (line 313) | def recurrent_generator(self, advantages, num_mini_batch, data_chunk_l... FILE: utils/util.py function check (line 5) | def check(input): function get_gard_norm (line 9) | def get_gard_norm(it): function update_linear_schedule (line 17) | def update_linear_schedule(optimizer, epoch, total_num_epochs, initial_lr): function huber_loss (line 23) | def huber_loss(e, d): function mse_loss (line 28) | def mse_loss(e): function get_shape_from_obs_space (line 31) | def get_shape_from_obs_space(obs_space): function get_shape_from_act_space (line 40) | def get_shape_from_act_space(act_space): function tile_images (line 54) | def tile_images(img_nhwc):