SYMBOL INDEX (796 symbols across 72 files) FILE: MACPO/macpo/algorithms/r_mappo/__init__.py function cost_trpo_macppo (line 1) | def cost_trpo_macppo(): FILE: MACPO/macpo/algorithms/r_mappo/algorithm/MACPPOPolicy.py class MACPPOPolicy (line 6) | class MACPPOPolicy: method __init__ (line 17) | def __init__(self, args, obs_space, cent_obs_space, act_space, device=... method lr_decay (line 45) | def lr_decay(self, episode, episodes): method get_actions (line 55) | def get_actions(self, cent_obs, obs, rnn_states_actor, rnn_states_crit... method get_values (line 88) | def get_values(self, cent_obs, rnn_states_critic, masks): method get_cost_values (line 100) | def get_cost_values(self, cent_obs, rnn_states_cost, masks): method evaluate_actions (line 112) | def evaluate_actions(self, cent_obs, obs, rnn_states_actor, rnn_states... method act (line 157) | def act(self, obs, rnn_states_actor, masks, available_actions=None, de... FILE: MACPO/macpo/algorithms/r_mappo/algorithm/rMAPPOPolicy.py class R_MAPPOPolicy (line 6) | class R_MAPPOPolicy: method __init__ (line 17) | def __init__(self, args, obs_space, cent_obs_space, act_space, device=... method lr_decay (line 39) | def lr_decay(self, episode, episodes): method get_actions (line 48) | def get_actions(self, cent_obs, obs, rnn_states_actor, rnn_states_crit... method get_values (line 76) | def get_values(self, cent_obs, rnn_states_critic, masks): method evaluate_actions (line 88) | def evaluate_actions(self, cent_obs, obs, rnn_states_actor, rnn_states... method act (line 116) | def act(self, obs, rnn_states_actor, masks, available_actions=None, de... FILE: MACPO/macpo/algorithms/r_mappo/algorithm/r_actor_critic.py class R_Actor (line 11) | class R_Actor(nn.Module): method __init__ (line 19) | def __init__(self, args, obs_space, action_space, device=torch.device(... method forward (line 43) | def forward(self, obs, rnn_states, masks, available_actions=None, dete... method evaluate_actions (line 72) | def evaluate_actions(self, obs, rnn_states, action, masks, available_a... class R_Critic (line 125) | class R_Critic(nn.Module): method __init__ (line 133) | def __init__(self, args, cent_obs_space, device=torch.device("cpu")): method forward (line 157) | def forward(self, cent_obs, rnn_states, masks): FILE: MACPO/macpo/algorithms/r_mappo/r_macpo.py class R_MACTRPO_CPO (line 14) | class R_MACTRPO_CPO(): method __init__ (line 22) | def __init__(self, method cal_value_loss (line 124) | def cal_value_loss(self, values, value_preds_batch, return_batch, acti... method flat_grad (line 164) | def flat_grad(self, grads): method flat_hessian (line 173) | def flat_hessian(self, hessians): method flat_params (line 182) | def flat_params(self, model): method update_model (line 189) | def update_model(self, model, new_params): method kl_divergence (line 198) | def kl_divergence(self, obs, rnn_states, action, masks, available_acti... method conjugate_gradient (line 218) | def conjugate_gradient(self, actor, obs, rnn_states, action, masks, av... method fisher_vector_product (line 237) | def fisher_vector_product(self, actor, obs, rnn_states, action, masks,... method _get_flat_grad (line 251) | def _get_flat_grad(self, y, model, retain_graph=None, create_graph=Fal... method _flat_grad_ (line 262) | def _flat_grad_(self, f, model, retain_graph=None, create_graph=False): method hessian_vector_product (line 266) | def hessian_vector_product(self, f, model): method cg (line 274) | def cg(self, Ax, b, cg_iters=10): method trpo_update (line 289) | def trpo_update(self, sample, update_actor=True): method train (line 565) | def train(self, buffer, shared_buffer=None, update_actor=True): method prep_training (line 657) | def prep_training(self): method prep_rollout (line 661) | def prep_rollout(self): FILE: MACPO/macpo/algorithms/utils/act.py class ACTLayer (line 5) | class ACTLayer(nn.Module): method __init__ (line 13) | def __init__(self, action_space, inputs_dim, use_orthogonal, gain, arg... method forward (line 41) | def forward(self, x, available_actions=None, deterministic=False): method get_probs (line 85) | def get_probs(self, x, available_actions=None): method evaluate_actions (line 107) | def evaluate_actions(self, x, action, available_actions=None, active_m... method evaluate_actions_trpo (line 165) | def evaluate_actions_trpo(self, x, action, available_actions=None, act... FILE: MACPO/macpo/algorithms/utils/cnn.py class Flatten (line 6) | class Flatten(nn.Module): method forward (line 7) | def forward(self, x): class CNNLayer (line 11) | class CNNLayer(nn.Module): method __init__ (line 12) | def __init__(self, obs_shape, hidden_size, use_orthogonal, use_ReLU, k... method forward (line 40) | def forward(self, x): class CNNBase (line 46) | class CNNBase(nn.Module): method __init__ (line 47) | def __init__(self, args, obs_shape): method forward (line 56) | def forward(self, x): FILE: MACPO/macpo/algorithms/utils/distributions.py class FixedCategorical (line 14) | class FixedCategorical(torch.distributions.Categorical): method sample (line 15) | def sample(self): method log_probs (line 18) | def log_probs(self, actions): method mode (line 27) | def mode(self): class FixedNormal (line 32) | class FixedNormal(torch.distributions.Normal): method log_probs (line 33) | def log_probs(self, actions): method entrop (line 37) | def entrop(self): method mode (line 40) | def mode(self): class FixedBernoulli (line 45) | class FixedBernoulli(torch.distributions.Bernoulli): method log_probs (line 46) | def log_probs(self, actions): method entropy (line 49) | def entropy(self): method mode (line 52) | def mode(self): class Categorical (line 56) | class Categorical(nn.Module): method __init__ (line 57) | def __init__(self, num_inputs, num_outputs, use_orthogonal=True, gain=... method forward (line 65) | def forward(self, x, available_actions=None): class DiagGaussian (line 94) | class DiagGaussian(nn.Module): method __init__ (line 95) | def __init__(self, num_inputs, num_outputs, use_orthogonal=True, gain=... method forward (line 113) | def forward(self, x, available_actions=None): class Bernoulli (line 125) | class Bernoulli(nn.Module): method __init__ (line 126) | def __init__(self, num_inputs, num_outputs, use_orthogonal=True, gain=... method forward (line 134) | def forward(self, x): class AddBias (line 138) | class AddBias(nn.Module): method __init__ (line 139) | def __init__(self, bias): method forward (line 143) | def forward(self, x): FILE: MACPO/macpo/algorithms/utils/mlp.py class MLPLayer (line 6) | class MLPLayer(nn.Module): method __init__ (line 7) | def __init__(self, input_dim, hidden_size, layer_N, use_orthogonal, us... method forward (line 27) | def forward(self, x): class MLPBase (line 34) | class MLPBase(nn.Module): method __init__ (line 35) | def __init__(self, args, obs_shape, cat_self=True, attn_internal=False): method forward (line 53) | def forward(self, x): FILE: MACPO/macpo/algorithms/utils/rnn.py class RNNLayer (line 7) | class RNNLayer(nn.Module): method __init__ (line 8) | def __init__(self, inputs_dim, outputs_dim, recurrent_N, use_orthogonal): method forward (line 24) | def forward(self, x, hxs, masks): FILE: MACPO/macpo/algorithms/utils/util.py function init (line 7) | def init(module, weight_init, bias_init, gain=1): function get_clones (line 12) | def get_clones(module, N): function check (line 15) | def check(input): FILE: MACPO/macpo/config.py function get_config (line 4) | def get_config(): FILE: MACPO/macpo/envs/env_wrappers.py class CloudpickleWrapper (line 10) | class CloudpickleWrapper(object): method __init__ (line 15) | def __init__(self, x): method __getstate__ (line 18) | def __getstate__(self): method __setstate__ (line 22) | def __setstate__(self, ob): class ShareVecEnv (line 27) | class ShareVecEnv(ABC): method __init__ (line 41) | def __init__(self, num_envs, observation_space, share_observation_spac... method reset (line 48) | def reset(self): method step_async (line 60) | def step_async(self, actions): method step_wait (line 72) | def step_wait(self): method close_extras (line 86) | def close_extras(self): method close (line 93) | def close(self): method step (line 101) | def step(self, actions): method render (line 110) | def render(self, mode='human'): method get_images (line 121) | def get_images(self): method unwrapped (line 128) | def unwrapped(self): method get_viewer (line 134) | def get_viewer(self): function worker (line 141) | def worker(remote, parent_remote, env_fn_wrapper): class GuardSubprocVecEnv (line 178) | class GuardSubprocVecEnv(ShareVecEnv): method __init__ (line 179) | def __init__(self, env_fns, spaces=None): method step_async (line 200) | def step_async(self, actions): method step_wait (line 206) | def step_wait(self): method reset (line 212) | def reset(self): method reset_task (line 218) | def reset_task(self): method close (line 223) | def close(self): class SubprocVecEnv (line 236) | class SubprocVecEnv(ShareVecEnv): method __init__ (line 237) | def __init__(self, env_fns, spaces=None): method step_async (line 258) | def step_async(self, actions): method step_wait (line 263) | def step_wait(self): method reset (line 269) | def reset(self): method reset_task (line 276) | def reset_task(self): method close (line 281) | def close(self): method render (line 293) | def render(self, mode="rgb_array"): function shareworker (line 301) | def shareworker(remote, parent_remote, env_fn_wrapper): class ShareSubprocVecEnv (line 344) | class ShareSubprocVecEnv(ShareVecEnv): method __init__ (line 345) | def __init__(self, env_fns, spaces=None): method step_async (line 369) | def step_async(self, actions): method step_wait (line 374) | def step_wait(self): method reset (line 384) | def reset(self): method reset_task (line 391) | def reset_task(self): method close (line 396) | def close(self): function choosesimpleworker (line 409) | def choosesimpleworker(remote, parent_remote, env_fn_wrapper): class ChooseSimpleSubprocVecEnv (line 440) | class ChooseSimpleSubprocVecEnv(ShareVecEnv): method __init__ (line 441) | def __init__(self, env_fns, spaces=None): method step_async (line 461) | def step_async(self, actions): method step_wait (line 466) | def step_wait(self): method reset (line 472) | def reset(self, reset_choose): method render (line 478) | def render(self, mode="rgb_array"): method reset_task (line 485) | def reset_task(self): method close (line 490) | def close(self): function chooseworker (line 503) | def chooseworker(remote, parent_remote, env_fn_wrapper): class ChooseSubprocVecEnv (line 530) | class ChooseSubprocVecEnv(ShareVecEnv): method __init__ (line 531) | def __init__(self, env_fns, spaces=None): method step_async (line 552) | def step_async(self, actions): method step_wait (line 557) | def step_wait(self): method reset (line 563) | def reset(self, reset_choose): method reset_task (line 570) | def reset_task(self): method close (line 575) | def close(self): function chooseguardworker (line 588) | def chooseguardworker(remote, parent_remote, env_fn_wrapper): class ChooseGuardSubprocVecEnv (line 613) | class ChooseGuardSubprocVecEnv(ShareVecEnv): method __init__ (line 614) | def __init__(self, env_fns, spaces=None): method step_async (line 635) | def step_async(self, actions): method step_wait (line 640) | def step_wait(self): method reset (line 646) | def reset(self, reset_choose): method reset_task (line 652) | def reset_task(self): method close (line 657) | def close(self): class DummyVecEnv (line 671) | class DummyVecEnv(ShareVecEnv): method __init__ (line 672) | def __init__(self, env_fns): method step_async (line 679) | def step_async(self, actions): method step_wait (line 682) | def step_wait(self): method reset (line 697) | def reset(self): method close (line 701) | def close(self): method render (line 705) | def render(self, mode="human"): class ShareDummyVecEnv (line 716) | class ShareDummyVecEnv(ShareVecEnv): method __init__ (line 717) | def __init__(self, env_fns): method step_async (line 724) | def step_async(self, actions): method step_wait (line 727) | def step_wait(self): method reset (line 743) | def reset(self): method close (line 748) | def close(self): method render (line 752) | def render(self, mode="human"): class ChooseDummyVecEnv (line 762) | class ChooseDummyVecEnv(ShareVecEnv): method __init__ (line 763) | def __init__(self, env_fns): method step_async (line 770) | def step_async(self, actions): method step_wait (line 773) | def step_wait(self): method reset (line 780) | def reset(self, reset_choose): method close (line 786) | def close(self): method render (line 790) | def render(self, mode="human"): class ChooseSimpleDummyVecEnv (line 799) | class ChooseSimpleDummyVecEnv(ShareVecEnv): method __init__ (line 800) | def __init__(self, env_fns): method step_async (line 807) | def step_async(self, actions): method step_wait (line 810) | def step_wait(self): method reset (line 816) | def reset(self, reset_choose): method close (line 821) | def close(self): method render (line 825) | def render(self, mode="human"): FILE: MACPO/macpo/envs/safety_ma_mujoco/safety_multiagent_mujoco/ant.py class AntEnv (line 8) | class AntEnv(mujoco_env.MujocoEnv, utils.EzPickle): method __init__ (line 9) | def __init__(self, **kwargs): method step (line 13) | def step(self, a): method _get_obs (line 61) | def _get_obs(self): method reset_model (line 81) | def reset_model(self): method viewer_setup (line 89) | def viewer_setup(self): FILE: MACPO/macpo/envs/safety_ma_mujoco/safety_multiagent_mujoco/coupled_half_cheetah.py class CoupledHalfCheetah (line 9) | class CoupledHalfCheetah(mujoco_env.MujocoEnv, utils.EzPickle): method __init__ (line 10) | def __init__(self, **kwargs): method step (line 14) | def step(self, action): method _get_obs (line 117) | def _get_obs(self): method reset_model (line 137) | def reset_model(self): method viewer_setup (line 143) | def viewer_setup(self): method get_env_info (line 146) | def get_env_info(self): method _set_action_space (line 149) | def _set_action_space(self): FILE: MACPO/macpo/envs/safety_ma_mujoco/safety_multiagent_mujoco/half_cheetah.py class HalfCheetahEnv (line 10) | class HalfCheetahEnv(mujoco_env.MujocoEnv, utils.EzPickle): method __init__ (line 11) | def __init__(self, **kwargs): method step (line 16) | def step(self, action): method _get_obs (line 48) | def _get_obs(self): method reset_model (line 61) | def reset_model(self): method viewer_setup (line 67) | def viewer_setup(self): method _set_action_space (line 70) | def _set_action_space(self): FILE: MACPO/macpo/envs/safety_ma_mujoco/safety_multiagent_mujoco/hopper.py class HopperEnv (line 7) | class HopperEnv(mujoco_env.MujocoEnv, utils.EzPickle): method __init__ (line 8) | def __init__(self, **kwargs): method step (line 13) | def step(self, a): method _get_obs (line 50) | def _get_obs(self): method reset_model (line 63) | def reset_model(self): method last_mocap_x (line 69) | def last_mocap_x(self): method viewer_setup (line 72) | def viewer_setup(self): FILE: MACPO/macpo/envs/safety_ma_mujoco/safety_multiagent_mujoco/humanoid.py function mass_center (line 8) | def mass_center(model, sim): class HumanoidEnv (line 14) | class HumanoidEnv(mujoco_env.MujocoEnv, utils.EzPickle): method __init__ (line 15) | def __init__(self, **kwargs): method _get_obs (line 19) | def _get_obs(self): method step (line 44) | def step(self, a): method reset_model (line 85) | def reset_model(self): method viewer_setup (line 99) | def viewer_setup(self): FILE: MACPO/macpo/envs/safety_ma_mujoco/safety_multiagent_mujoco/manyagent_ant.py class ManyAgentAntEnv (line 10) | class ManyAgentAntEnv(mujoco_env.MujocoEnv, utils.EzPickle): method __init__ (line 11) | def __init__(self, **kwargs): method _generate_asset (line 33) | def _generate_asset(self, n_segs, asset_path): method step (line 86) | def step(self, a): method _get_obs (line 156) | def _get_obs(self): method reset_model (line 188) | def reset_model(self): method viewer_setup (line 196) | def viewer_setup(self): FILE: MACPO/macpo/envs/safety_ma_mujoco/safety_multiagent_mujoco/manyagent_swimmer.py class ManyAgentSwimmerEnv (line 9) | class ManyAgentSwimmerEnv(mujoco_env.MujocoEnv, utils.EzPickle): method __init__ (line 10) | def __init__(self, **kwargs): method _generate_asset (line 30) | def _generate_asset(self, n_segs, asset_path): method step (line 66) | def step(self, a): method _get_obs (line 123) | def _get_obs(self): method reset_model (line 144) | def reset_model(self): FILE: MACPO/macpo/envs/safety_ma_mujoco/safety_multiagent_mujoco/mujoco_env.py function convert_observation_to_space (line 19) | def convert_observation_to_space(observation): class MujocoEnv (line 35) | class MujocoEnv(gym.Env): method __init__ (line 39) | def __init__(self, model_path, frame_skip): method _set_action_space (line 71) | def _set_action_space(self): method _set_observation_space (line 77) | def _set_observation_space(self, observation): method seed (line 81) | def seed(self, seed=None): method reset_model (line 88) | def reset_model(self): method viewer_setup (line 95) | def viewer_setup(self): method reset (line 105) | def reset(self): method set_state (line 110) | def set_state(self, qpos, qvel): method dt (line 119) | def dt(self): method do_simulation (line 122) | def do_simulation(self, ctrl, n_frames): method render (line 127) | def render(self, method close (line 160) | def close(self): method _get_viewer (line 166) | def _get_viewer(self, mode): method get_body_com (line 178) | def get_body_com(self, body_name): method state_vector (line 181) | def state_vector(self): method place_random_objects (line 187) | def place_random_objects(self): FILE: MACPO/macpo/envs/safety_ma_mujoco/safety_multiagent_mujoco/mujoco_multi.py function env_fn (line 13) | def env_fn(env, **kwargs) -> MultiAgentEnv: # TODO: this may be a more ... class NormalizedActions (line 26) | class NormalizedActions(gym.ActionWrapper): method _action (line 28) | def _action(self, action): method action (line 34) | def action(self, action_): method _reverse_action (line 37) | def _reverse_action(self, action): class MujocoMulti (line 44) | class MujocoMulti(MultiAgentEnv): method __init__ (line 46) | def __init__(self, batch_size=None, **kwargs): method step (line 176) | def step(self, actions): method get_obs (line 205) | def get_obs(self): method get_obs_agent (line 220) | def get_obs_agent(self, agent_id): method get_obs_size (line 236) | def get_obs_size(self): method get_state (line 244) | def get_state(self, team=None): method get_state_size (line 257) | def get_state_size(self): method get_avail_actions (line 261) | def get_avail_actions(self): # all actions are always available method get_avail_agent_actions (line 264) | def get_avail_agent_actions(self, agent_id): method get_total_actions (line 268) | def get_total_actions(self): method get_stats (line 273) | def get_stats(self): method get_agg_stats (line 277) | def get_agg_stats(self, stats): method reset (line 280) | def reset(self, **kwargs): method render (line 286) | def render(self, **kwargs): method close (line 289) | def close(self): method seed (line 292) | def seed(self, args): method get_env_info (line 295) | def get_env_info(self): FILE: MACPO/macpo/envs/safety_ma_mujoco/safety_multiagent_mujoco/multiagentenv.py function convert (line 5) | def convert(dictionary): class MultiAgentEnv (line 8) | class MultiAgentEnv(object): method __init__ (line 10) | def __init__(self, batch_size=None, **kwargs): method step (line 21) | def step(self, actions): method get_obs (line 25) | def get_obs(self): method get_obs_agent (line 29) | def get_obs_agent(self, agent_id): method get_obs_size (line 33) | def get_obs_size(self): method get_state (line 37) | def get_state(self): method get_state_size (line 40) | def get_state_size(self): method get_avail_actions (line 44) | def get_avail_actions(self): method get_avail_agent_actions (line 47) | def get_avail_agent_actions(self, agent_id): method get_total_actions (line 51) | def get_total_actions(self): method get_stats (line 56) | def get_stats(self): method get_agg_stats (line 60) | def get_agg_stats(self, stats): method reset (line 63) | def reset(self): method render (line 67) | def render(self): method close (line 70) | def close(self): method seed (line 73) | def seed(self, seed): method get_env_info (line 76) | def get_env_info(self): FILE: MACPO/macpo/envs/safety_ma_mujoco/safety_multiagent_mujoco/obsk.py class Node (line 5) | class Node(): method __init__ (line 6) | def __init__(self, label, qpos_ids, qvel_ids, act_ids, body_fn=None, b... method __str__ (line 17) | def __str__(self): method __repr__ (line 20) | def __repr__(self): class HyperEdge (line 24) | class HyperEdge(): method __init__ (line 25) | def __init__(self, *edges): method __contains__ (line 28) | def __contains__(self, item): method __str__ (line 31) | def __str__(self): method __repr__ (line 34) | def __repr__(self): function get_joints_at_kdist (line 38) | def get_joints_at_kdist(agent_id, agent_partitions, hyperedges, k=0, kag... function build_obs (line 74) | def build_obs(env, k_dict, k_categories, global_dict, global_categories,... function build_actions (line 141) | def build_actions(agent_partitions, k_dict): function get_parts_and_edges (line 146) | def get_parts_and_edges(label, partitioning): FILE: MACPO/macpo/envs/safety_ma_mujoco/test.py function main (line 6) | def main(): FILE: MACPO/macpo/runner/separated/base_runner.py function _t2n (line 13) | def _t2n(x): class Runner (line 16) | class Runner(object): method __init__ (line 17) | def __init__(self, config): method run (line 105) | def run(self): method warmup (line 108) | def warmup(self): method collect (line 111) | def collect(self, step): method insert (line 114) | def insert(self, data): method compute (line 118) | def compute(self): method train (line 127) | def train(self): method save (line 139) | def save(self): method restore (line 150) | def restore(self): method log_train (line 161) | def log_train(self, train_infos, total_num_steps): method log_env (line 170) | def log_env(self, env_infos, total_num_steps): FILE: MACPO/macpo/runner/separated/base_runner_macpo.py function _t2n (line 14) | def _t2n(x): class Runner (line 18) | class Runner(object): method __init__ (line 19) | def __init__(self, config): method run (line 110) | def run(self): method warmup (line 113) | def warmup(self): method collect (line 116) | def collect(self, step): method insert (line 119) | def insert(self, data): method compute (line 123) | def compute(self): method train (line 138) | def train(self): method buffer_filter (line 192) | def buffer_filter(self, agent_id): method remove_episodes (line 219) | def remove_episodes(self, agent_id, del_ids): method save (line 244) | def save(self): method restore (line 255) | def restore(self): method log_train (line 266) | def log_train(self, train_infos, total_num_steps): method log_env (line 275) | def log_env(self, env_infos, total_num_steps): FILE: MACPO/macpo/runner/separated/mujoco_runner.py function _t2n (line 9) | def _t2n(x): class MujocoRunner (line 13) | class MujocoRunner(Runner): method __init__ (line 16) | def __init__(self, config): method run (line 19) | def run(self): method warmup (line 90) | def warmup(self): method collect (line 102) | def collect(self, step): method insert (line 130) | def insert(self, data): method log_train (line 158) | def log_train(self, train_infos, total_num_steps): method eval (line 170) | def eval(self, total_num_steps): FILE: MACPO/macpo/runner/separated/mujoco_runner_macpo.py function _t2n (line 11) | def _t2n(x): class MujocoRunner (line 15) | class MujocoRunner(Runner): method __init__ (line 18) | def __init__(self, config): method run (line 22) | def run(self): method return_aver_cost (line 118) | def return_aver_cost(self, aver_episode_costs): method warmup (line 125) | def warmup(self): method collect (line 138) | def collect(self, step): method insert (line 178) | def insert(self, data, aver_episode_costs = 0): method log_train (line 213) | def log_train(self, train_infos, total_num_steps): method eval (line 226) | def eval(self, total_num_steps): FILE: MACPO/macpo/scripts/train/train_mujoco.py function make_train_env (line 23) | def make_train_env(all_args): function make_eval_env (line 46) | def make_eval_env(all_args): function parse_args (line 69) | def parse_args(args, parser): function main (line 92) | def main(args): FILE: MACPO/macpo/utils/multi_discrete.py class MultiDiscrete (line 6) | class MultiDiscrete(gym.Space): method __init__ (line 22) | def __init__(self, array_of_param_array): method sample (line 28) | def sample(self): method contains (line 34) | def contains(self, x): method shape (line 38) | def shape(self): method __repr__ (line 41) | def __repr__(self): method __eq__ (line 44) | def __eq__(self, other): FILE: MACPO/macpo/utils/popart.py class PopArt (line 8) | class PopArt(nn.Module): method __init__ (line 11) | def __init__(self, input_shape, norm_axes=1, beta=0.99999, per_element... method reset_parameters (line 25) | def reset_parameters(self): method running_mean_var (line 30) | def running_mean_var(self): method forward (line 36) | def forward(self, input_vector, train=True): method denormalize (line 64) | def denormalize(self, input_vector): FILE: MACPO/macpo/utils/separated_buffer.py function _flatten (line 8) | def _flatten(T, N, x): function _cast (line 12) | def _cast(x): class SeparatedReplayBuffer (line 16) | class SeparatedReplayBuffer(object): method __init__ (line 17) | def __init__(self, args, obs_space, share_obs_space, act_space): method update_factor (line 74) | def update_factor(self, factor): method return_aver_insert (line 77) | def return_aver_insert(self, aver_episode_costs): method insert (line 80) | def insert(self, share_obs, obs, rnn_states, rnn_states_critic, action... method chooseinsert (line 110) | def chooseinsert(self, share_obs, obs, rnn_states, rnn_states_critic, ... method after_update (line 130) | def after_update(self): method chooseafter_update (line 142) | def chooseafter_update(self): method compute_returns (line 148) | def compute_returns(self, next_value, value_normalizer=None): method compute_cost_returns (line 195) | def compute_cost_returns(self, next_cost, value_normalizer=None): method feed_forward_generator (line 239) | def feed_forward_generator(self, advantages, num_mini_batch=None, mini... method naive_recurrent_generator (line 323) | def naive_recurrent_generator(self, advantages, num_mini_batch, cost_a... FILE: MACPO/macpo/utils/util.py function check (line 5) | def check(input): function get_gard_norm (line 9) | def get_gard_norm(it): function update_linear_schedule (line 17) | def update_linear_schedule(optimizer, epoch, total_num_epochs, initial_lr): function huber_loss (line 23) | def huber_loss(e, d): function mse_loss (line 28) | def mse_loss(e): function get_shape_from_obs_space (line 31) | def get_shape_from_obs_space(obs_space): function get_shape_from_act_space (line 40) | def get_shape_from_act_space(act_space): function tile_images (line 54) | def tile_images(img_nhwc): FILE: MACPO/setup.py function get_version (line 8) | def get_version() -> str: FILE: MAPPO-Lagrangian/mappo_lagrangian/algorithms/r_mappo/__init__.py function cost_trpo_macppo (line 1) | def cost_trpo_macppo(): FILE: MAPPO-Lagrangian/mappo_lagrangian/algorithms/r_mappo/algorithm/MACPPOPolicy.py class MACPPOPolicy (line 6) | class MACPPOPolicy: method __init__ (line 17) | def __init__(self, args, obs_space, cent_obs_space, act_space, device=... method lr_decay (line 44) | def lr_decay(self, episode, episodes): method get_actions (line 54) | def get_actions(self, cent_obs, obs, rnn_states_actor, rnn_states_crit... method get_values (line 87) | def get_values(self, cent_obs, rnn_states_critic, masks): method get_cost_values (line 99) | def get_cost_values(self, cent_obs, rnn_states_cost, masks): method evaluate_actions (line 111) | def evaluate_actions(self, cent_obs, obs, rnn_states_actor, rnn_states... method act (line 143) | def act(self, obs, rnn_states_actor, masks, available_actions=None, de... FILE: MAPPO-Lagrangian/mappo_lagrangian/algorithms/r_mappo/algorithm/rMAPPOPolicy.py class R_MAPPOPolicy (line 6) | class R_MAPPOPolicy: method __init__ (line 17) | def __init__(self, args, obs_space, cent_obs_space, act_space, device=... method lr_decay (line 39) | def lr_decay(self, episode, episodes): method get_actions (line 48) | def get_actions(self, cent_obs, obs, rnn_states_actor, rnn_states_crit... method get_values (line 76) | def get_values(self, cent_obs, rnn_states_critic, masks): method evaluate_actions (line 88) | def evaluate_actions(self, cent_obs, obs, rnn_states_actor, rnn_states... method act (line 116) | def act(self, obs, rnn_states_actor, masks, available_actions=None, de... FILE: MAPPO-Lagrangian/mappo_lagrangian/algorithms/r_mappo/algorithm/r_actor_critic.py class R_Actor (line 11) | class R_Actor(nn.Module): method __init__ (line 19) | def __init__(self, args, obs_space, action_space, device=torch.device(... method forward (line 42) | def forward(self, obs, rnn_states, masks, available_actions=None, dete... method evaluate_actions (line 71) | def evaluate_actions(self, obs, rnn_states, action, masks, available_a... class R_Critic (line 109) | class R_Critic(nn.Module): method __init__ (line 117) | def __init__(self, args, cent_obs_space, device=torch.device("cpu")): method forward (line 141) | def forward(self, cent_obs, rnn_states, masks): FILE: MAPPO-Lagrangian/mappo_lagrangian/algorithms/r_mappo/r_mappo_lagr.py class R_MAPPO_Lagr (line 8) | class R_MAPPO_Lagr: method __init__ (line 26) | def __init__(self, method cal_value_loss (line 86) | def cal_value_loss(self, values, value_preds_batch, return_batch, acti... method _get_flat_grad (line 126) | def _get_flat_grad(self, y: torch.Tensor, model: nn.Module, **kwargs) ... method _conjugate_gradients (line 137) | def _conjugate_gradients(self, b: torch.Tensor, flat_kl_grad: torch.Te... method cal_second_hessian (line 156) | def cal_second_hessian(self, v: torch.Tensor, flat_kl_grad: torch.Tens... method _set_from_flat_params (line 164) | def _set_from_flat_params(self, model: nn.Module, flat_params: torch.T... method ppo_update (line 173) | def ppo_update(self, sample, update_actor=True, precomputed_eval=None, method train (line 303) | def train(self, buffer, update_actor=True): method prep_training (line 370) | def prep_training(self): method prep_rollout (line 375) | def prep_rollout(self): FILE: MAPPO-Lagrangian/mappo_lagrangian/algorithms/utils/act.py class ACTLayer (line 5) | class ACTLayer(nn.Module): method __init__ (line 13) | def __init__(self, action_space, inputs_dim, use_orthogonal, gain, arg... method forward (line 41) | def forward(self, x, available_actions=None, deterministic=False): method get_probs (line 85) | def get_probs(self, x, available_actions=None): method evaluate_actions (line 107) | def evaluate_actions(self, x, action, available_actions=None, active_m... FILE: MAPPO-Lagrangian/mappo_lagrangian/algorithms/utils/cnn.py class Flatten (line 6) | class Flatten(nn.Module): method forward (line 7) | def forward(self, x): class CNNLayer (line 11) | class CNNLayer(nn.Module): method __init__ (line 12) | def __init__(self, obs_shape, hidden_size, use_orthogonal, use_ReLU, k... method forward (line 40) | def forward(self, x): class CNNBase (line 46) | class CNNBase(nn.Module): method __init__ (line 47) | def __init__(self, args, obs_shape): method forward (line 56) | def forward(self, x): FILE: MAPPO-Lagrangian/mappo_lagrangian/algorithms/utils/distributions.py class FixedCategorical (line 14) | class FixedCategorical(torch.distributions.Categorical): method sample (line 15) | def sample(self): method log_probs (line 18) | def log_probs(self, actions): method mode (line 27) | def mode(self): class FixedNormal (line 32) | class FixedNormal(torch.distributions.Normal): method log_probs (line 33) | def log_probs(self, actions): method entrop (line 37) | def entrop(self): method mode (line 40) | def mode(self): class FixedBernoulli (line 45) | class FixedBernoulli(torch.distributions.Bernoulli): method log_probs (line 46) | def log_probs(self, actions): method entropy (line 49) | def entropy(self): method mode (line 52) | def mode(self): class Categorical (line 56) | class Categorical(nn.Module): method __init__ (line 57) | def __init__(self, num_inputs, num_outputs, use_orthogonal=True, gain=... method forward (line 65) | def forward(self, x, available_actions=None): class DiagGaussian (line 94) | class DiagGaussian(nn.Module): method __init__ (line 95) | def __init__(self, num_inputs, num_outputs, use_orthogonal=True, gain=... method forward (line 113) | def forward(self, x, available_actions=None): class Bernoulli (line 118) | class Bernoulli(nn.Module): method __init__ (line 119) | def __init__(self, num_inputs, num_outputs, use_orthogonal=True, gain=... method forward (line 127) | def forward(self, x): class AddBias (line 131) | class AddBias(nn.Module): method __init__ (line 132) | def __init__(self, bias): method forward (line 136) | def forward(self, x): FILE: MAPPO-Lagrangian/mappo_lagrangian/algorithms/utils/mlp.py class MLPLayer (line 6) | class MLPLayer(nn.Module): method __init__ (line 7) | def __init__(self, input_dim, hidden_size, layer_N, use_orthogonal, us... method forward (line 24) | def forward(self, x): class MLPBase (line 31) | class MLPBase(nn.Module): method __init__ (line 32) | def __init__(self, args, obs_shape, cat_self=True, attn_internal=False): method forward (line 50) | def forward(self, x): FILE: MAPPO-Lagrangian/mappo_lagrangian/algorithms/utils/rnn.py class RNNLayer (line 7) | class RNNLayer(nn.Module): method __init__ (line 8) | def __init__(self, inputs_dim, outputs_dim, recurrent_N, use_orthogonal): method forward (line 24) | def forward(self, x, hxs, masks): FILE: MAPPO-Lagrangian/mappo_lagrangian/algorithms/utils/util.py function init (line 7) | def init(module, weight_init, bias_init, gain=1): function get_clones (line 12) | def get_clones(module, N): function check (line 15) | def check(input): FILE: MAPPO-Lagrangian/mappo_lagrangian/config.py function get_config (line 4) | def get_config(): FILE: MAPPO-Lagrangian/mappo_lagrangian/envs/env_wrappers.py class CloudpickleWrapper (line 10) | class CloudpickleWrapper(object): method __init__ (line 15) | def __init__(self, x): method __getstate__ (line 18) | def __getstate__(self): method __setstate__ (line 22) | def __setstate__(self, ob): class ShareVecEnv (line 27) | class ShareVecEnv(ABC): method __init__ (line 41) | def __init__(self, num_envs, observation_space, share_observation_spac... method reset (line 48) | def reset(self): method step_async (line 60) | def step_async(self, actions): method step_wait (line 72) | def step_wait(self): method close_extras (line 86) | def close_extras(self): method close (line 93) | def close(self): method step (line 101) | def step(self, actions): method render (line 110) | def render(self, mode='human'): method get_images (line 121) | def get_images(self): method unwrapped (line 128) | def unwrapped(self): method get_viewer (line 134) | def get_viewer(self): function worker (line 141) | def worker(remote, parent_remote, env_fn_wrapper): class GuardSubprocVecEnv (line 178) | class GuardSubprocVecEnv(ShareVecEnv): method __init__ (line 179) | def __init__(self, env_fns, spaces=None): method step_async (line 200) | def step_async(self, actions): method step_wait (line 206) | def step_wait(self): method reset (line 212) | def reset(self): method reset_task (line 218) | def reset_task(self): method close (line 223) | def close(self): class SubprocVecEnv (line 236) | class SubprocVecEnv(ShareVecEnv): method __init__ (line 237) | def __init__(self, env_fns, spaces=None): method step_async (line 258) | def step_async(self, actions): method step_wait (line 263) | def step_wait(self): method reset (line 269) | def reset(self): method reset_task (line 276) | def reset_task(self): method close (line 281) | def close(self): method render (line 293) | def render(self, mode="rgb_array"): function shareworker (line 301) | def shareworker(remote, parent_remote, env_fn_wrapper): class ShareSubprocVecEnv (line 344) | class ShareSubprocVecEnv(ShareVecEnv): method __init__ (line 345) | def __init__(self, env_fns, spaces=None): method step_async (line 369) | def step_async(self, actions): method step_wait (line 374) | def step_wait(self): method reset (line 384) | def reset(self): method reset_task (line 391) | def reset_task(self): method close (line 396) | def close(self): function choosesimpleworker (line 409) | def choosesimpleworker(remote, parent_remote, env_fn_wrapper): class ChooseSimpleSubprocVecEnv (line 440) | class ChooseSimpleSubprocVecEnv(ShareVecEnv): method __init__ (line 441) | def __init__(self, env_fns, spaces=None): method step_async (line 461) | def step_async(self, actions): method step_wait (line 466) | def step_wait(self): method reset (line 472) | def reset(self, reset_choose): method render (line 478) | def render(self, mode="rgb_array"): method reset_task (line 485) | def reset_task(self): method close (line 490) | def close(self): function chooseworker (line 503) | def chooseworker(remote, parent_remote, env_fn_wrapper): class ChooseSubprocVecEnv (line 530) | class ChooseSubprocVecEnv(ShareVecEnv): method __init__ (line 531) | def __init__(self, env_fns, spaces=None): method step_async (line 552) | def step_async(self, actions): method step_wait (line 557) | def step_wait(self): method reset (line 563) | def reset(self, reset_choose): method reset_task (line 570) | def reset_task(self): method close (line 575) | def close(self): function chooseguardworker (line 588) | def chooseguardworker(remote, parent_remote, env_fn_wrapper): class ChooseGuardSubprocVecEnv (line 613) | class ChooseGuardSubprocVecEnv(ShareVecEnv): method __init__ (line 614) | def __init__(self, env_fns, spaces=None): method step_async (line 635) | def step_async(self, actions): method step_wait (line 640) | def step_wait(self): method reset (line 646) | def reset(self, reset_choose): method reset_task (line 652) | def reset_task(self): method close (line 657) | def close(self): class DummyVecEnv (line 671) | class DummyVecEnv(ShareVecEnv): method __init__ (line 672) | def __init__(self, env_fns): method step_async (line 679) | def step_async(self, actions): method step_wait (line 682) | def step_wait(self): method reset (line 697) | def reset(self): method close (line 701) | def close(self): method render (line 705) | def render(self, mode="human"): class ShareDummyVecEnv (line 716) | class ShareDummyVecEnv(ShareVecEnv): method __init__ (line 717) | def __init__(self, env_fns): method step_async (line 724) | def step_async(self, actions): method step_wait (line 727) | def step_wait(self): method reset (line 743) | def reset(self): method close (line 748) | def close(self): method render (line 752) | def render(self, mode="human"): class ChooseDummyVecEnv (line 762) | class ChooseDummyVecEnv(ShareVecEnv): method __init__ (line 763) | def __init__(self, env_fns): method step_async (line 770) | def step_async(self, actions): method step_wait (line 773) | def step_wait(self): method reset (line 780) | def reset(self, reset_choose): method close (line 786) | def close(self): method render (line 790) | def render(self, mode="human"): class ChooseSimpleDummyVecEnv (line 799) | class ChooseSimpleDummyVecEnv(ShareVecEnv): method __init__ (line 800) | def __init__(self, env_fns): method step_async (line 807) | def step_async(self, actions): method step_wait (line 810) | def step_wait(self): method reset (line 816) | def reset(self, reset_choose): method close (line 821) | def close(self): method render (line 825) | def render(self, mode="human"): FILE: MAPPO-Lagrangian/mappo_lagrangian/envs/safety_ma_mujoco/safety_multiagent_mujoco/ant.py class AntEnv (line 8) | class AntEnv(mujoco_env.MujocoEnv, utils.EzPickle): method __init__ (line 9) | def __init__(self, **kwargs): method step (line 13) | def step(self, a): method _get_obs (line 61) | def _get_obs(self): method reset_model (line 81) | def reset_model(self): method viewer_setup (line 89) | def viewer_setup(self): FILE: MAPPO-Lagrangian/mappo_lagrangian/envs/safety_ma_mujoco/safety_multiagent_mujoco/coupled_half_cheetah.py class CoupledHalfCheetah (line 9) | class CoupledHalfCheetah(mujoco_env.MujocoEnv, utils.EzPickle): method __init__ (line 10) | def __init__(self, **kwargs): method step (line 14) | def step(self, action): method _get_obs (line 117) | def _get_obs(self): method reset_model (line 137) | def reset_model(self): method viewer_setup (line 143) | def viewer_setup(self): method get_env_info (line 146) | def get_env_info(self): method _set_action_space (line 149) | def _set_action_space(self): FILE: MAPPO-Lagrangian/mappo_lagrangian/envs/safety_ma_mujoco/safety_multiagent_mujoco/half_cheetah.py class HalfCheetahEnv (line 10) | class HalfCheetahEnv(mujoco_env.MujocoEnv, utils.EzPickle): method __init__ (line 11) | def __init__(self, **kwargs): method step (line 16) | def step(self, action): method _get_obs (line 48) | def _get_obs(self): method reset_model (line 61) | def reset_model(self): method viewer_setup (line 67) | def viewer_setup(self): method _set_action_space (line 70) | def _set_action_space(self): FILE: MAPPO-Lagrangian/mappo_lagrangian/envs/safety_ma_mujoco/safety_multiagent_mujoco/hopper.py class HopperEnv (line 7) | class HopperEnv(mujoco_env.MujocoEnv, utils.EzPickle): method __init__ (line 8) | def __init__(self, **kwargs): method step (line 13) | def step(self, a): method _get_obs (line 50) | def _get_obs(self): method reset_model (line 63) | def reset_model(self): method last_mocap_x (line 69) | def last_mocap_x(self): method viewer_setup (line 72) | def viewer_setup(self): FILE: MAPPO-Lagrangian/mappo_lagrangian/envs/safety_ma_mujoco/safety_multiagent_mujoco/humanoid.py function mass_center (line 8) | def mass_center(model, sim): class HumanoidEnv (line 14) | class HumanoidEnv(mujoco_env.MujocoEnv, utils.EzPickle): method __init__ (line 15) | def __init__(self, **kwargs): method _get_obs (line 19) | def _get_obs(self): method step (line 44) | def step(self, a): method reset_model (line 85) | def reset_model(self): method viewer_setup (line 99) | def viewer_setup(self): FILE: MAPPO-Lagrangian/mappo_lagrangian/envs/safety_ma_mujoco/safety_multiagent_mujoco/manyagent_ant.py class ManyAgentAntEnv (line 10) | class ManyAgentAntEnv(mujoco_env.MujocoEnv, utils.EzPickle): method __init__ (line 11) | def __init__(self, **kwargs): method _generate_asset (line 33) | def _generate_asset(self, n_segs, asset_path): method step (line 86) | def step(self, a): method _get_obs (line 154) | def _get_obs(self): method reset_model (line 186) | def reset_model(self): method viewer_setup (line 194) | def viewer_setup(self): FILE: MAPPO-Lagrangian/mappo_lagrangian/envs/safety_ma_mujoco/safety_multiagent_mujoco/manyagent_swimmer.py class ManyAgentSwimmerEnv (line 9) | class ManyAgentSwimmerEnv(mujoco_env.MujocoEnv, utils.EzPickle): method __init__ (line 10) | def __init__(self, **kwargs): method _generate_asset (line 30) | def _generate_asset(self, n_segs, asset_path): method step (line 66) | def step(self, a): method _get_obs (line 123) | def _get_obs(self): method reset_model (line 144) | def reset_model(self): FILE: MAPPO-Lagrangian/mappo_lagrangian/envs/safety_ma_mujoco/safety_multiagent_mujoco/mujoco_env.py function convert_observation_to_space (line 19) | def convert_observation_to_space(observation): class MujocoEnv (line 35) | class MujocoEnv(gym.Env): method __init__ (line 39) | def __init__(self, model_path, frame_skip): method _set_action_space (line 71) | def _set_action_space(self): method _set_observation_space (line 77) | def _set_observation_space(self, observation): method seed (line 81) | def seed(self, seed=None): method reset_model (line 88) | def reset_model(self): method viewer_setup (line 95) | def viewer_setup(self): method reset (line 105) | def reset(self): method set_state (line 110) | def set_state(self, qpos, qvel): method dt (line 119) | def dt(self): method do_simulation (line 122) | def do_simulation(self, ctrl, n_frames): method render (line 127) | def render(self, method close (line 160) | def close(self): method _get_viewer (line 166) | def _get_viewer(self, mode): method get_body_com (line 178) | def get_body_com(self, body_name): method state_vector (line 181) | def state_vector(self): method place_random_objects (line 187) | def place_random_objects(self): FILE: MAPPO-Lagrangian/mappo_lagrangian/envs/safety_ma_mujoco/safety_multiagent_mujoco/mujoco_multi.py function env_fn (line 13) | def env_fn(env, **kwargs) -> MultiAgentEnv: # TODO: this may be a more ... class NormalizedActions (line 26) | class NormalizedActions(gym.ActionWrapper): method _action (line 28) | def _action(self, action): method action (line 34) | def action(self, action_): method _reverse_action (line 37) | def _reverse_action(self, action): class MujocoMulti (line 44) | class MujocoMulti(MultiAgentEnv): method __init__ (line 46) | def __init__(self, batch_size=None, **kwargs): method step (line 176) | def step(self, actions): method get_obs (line 205) | def get_obs(self): method get_obs_agent (line 220) | def get_obs_agent(self, agent_id): method get_obs_size (line 236) | def get_obs_size(self): method get_state (line 244) | def get_state(self, team=None): method get_state_size (line 257) | def get_state_size(self): method get_avail_actions (line 261) | def get_avail_actions(self): # all actions are always available method get_avail_agent_actions (line 264) | def get_avail_agent_actions(self, agent_id): method get_total_actions (line 268) | def get_total_actions(self): method get_stats (line 273) | def get_stats(self): method get_agg_stats (line 277) | def get_agg_stats(self, stats): method reset (line 280) | def reset(self, **kwargs): method render (line 286) | def render(self, **kwargs): method close (line 289) | def close(self): method seed (line 292) | def seed(self, args): method get_env_info (line 295) | def get_env_info(self): FILE: MAPPO-Lagrangian/mappo_lagrangian/envs/safety_ma_mujoco/safety_multiagent_mujoco/multiagentenv.py function convert (line 5) | def convert(dictionary): class MultiAgentEnv (line 8) | class MultiAgentEnv(object): method __init__ (line 10) | def __init__(self, batch_size=None, **kwargs): method step (line 21) | def step(self, actions): method get_obs (line 25) | def get_obs(self): method get_obs_agent (line 29) | def get_obs_agent(self, agent_id): method get_obs_size (line 33) | def get_obs_size(self): method get_state (line 37) | def get_state(self): method get_state_size (line 40) | def get_state_size(self): method get_avail_actions (line 44) | def get_avail_actions(self): method get_avail_agent_actions (line 47) | def get_avail_agent_actions(self, agent_id): method get_total_actions (line 51) | def get_total_actions(self): method get_stats (line 56) | def get_stats(self): method get_agg_stats (line 60) | def get_agg_stats(self, stats): method reset (line 63) | def reset(self): method render (line 67) | def render(self): method close (line 70) | def close(self): method seed (line 73) | def seed(self, seed): method get_env_info (line 76) | def get_env_info(self): FILE: MAPPO-Lagrangian/mappo_lagrangian/envs/safety_ma_mujoco/safety_multiagent_mujoco/obsk.py class Node (line 5) | class Node(): method __init__ (line 6) | def __init__(self, label, qpos_ids, qvel_ids, act_ids, body_fn=None, b... method __str__ (line 17) | def __str__(self): method __repr__ (line 20) | def __repr__(self): class HyperEdge (line 24) | class HyperEdge(): method __init__ (line 25) | def __init__(self, *edges): method __contains__ (line 28) | def __contains__(self, item): method __str__ (line 31) | def __str__(self): method __repr__ (line 34) | def __repr__(self): function get_joints_at_kdist (line 38) | def get_joints_at_kdist(agent_id, agent_partitions, hyperedges, k=0, kag... function build_obs (line 74) | def build_obs(env, k_dict, k_categories, global_dict, global_categories,... function build_actions (line 141) | def build_actions(agent_partitions, k_dict): function get_parts_and_edges (line 146) | def get_parts_and_edges(label, partitioning): FILE: MAPPO-Lagrangian/mappo_lagrangian/envs/safety_ma_mujoco/test.py function main (line 6) | def main(): FILE: MAPPO-Lagrangian/mappo_lagrangian/runner/separated/base_runner.py function _t2n (line 13) | def _t2n(x): class Runner (line 16) | class Runner(object): method __init__ (line 17) | def __init__(self, config): method run (line 105) | def run(self): method warmup (line 108) | def warmup(self): method collect (line 111) | def collect(self, step): method insert (line 114) | def insert(self, data): method compute (line 118) | def compute(self): method train (line 127) | def train(self): method save (line 139) | def save(self): method restore (line 150) | def restore(self): method log_train (line 161) | def log_train(self, train_infos, total_num_steps): method log_env (line 170) | def log_env(self, env_infos, total_num_steps): FILE: MAPPO-Lagrangian/mappo_lagrangian/runner/separated/base_runner_mappo_lagr.py function _t2n (line 14) | def _t2n(x): class Runner (line 18) | class Runner(object): method __init__ (line 19) | def __init__(self, config): method run (line 113) | def run(self): method warmup (line 116) | def warmup(self): method collect (line 119) | def collect(self, step): method insert (line 122) | def insert(self, data): method compute (line 126) | def compute(self): method train (line 141) | def train(self): method buffer_filter (line 185) | def buffer_filter(self, agent_id): method remove_episodes (line 214) | def remove_episodes(self, agent_id, del_ids): method save (line 241) | def save(self): method restore (line 252) | def restore(self): method log_train (line 263) | def log_train(self, train_infos, total_num_steps): method log_env (line 272) | def log_env(self, env_infos, total_num_steps): FILE: MAPPO-Lagrangian/mappo_lagrangian/runner/separated/mujoco_runner.py function _t2n (line 9) | def _t2n(x): class MujocoRunner (line 13) | class MujocoRunner(Runner): method __init__ (line 16) | def __init__(self, config): method run (line 19) | def run(self): method warmup (line 90) | def warmup(self): method collect (line 102) | def collect(self, step): method insert (line 130) | def insert(self, data): method log_train (line 158) | def log_train(self, train_infos, total_num_steps): method eval (line 170) | def eval(self, total_num_steps): FILE: MAPPO-Lagrangian/mappo_lagrangian/runner/separated/mujoco_runner_mappo_lagr.py function _t2n (line 11) | def _t2n(x): class MujocoRunner (line 15) | class MujocoRunner(Runner): method __init__ (line 18) | def __init__(self, config): method run (line 21) | def run(self): method return_aver_cost (line 105) | def return_aver_cost(self, aver_episode_costs): method warmup (line 109) | def warmup(self): method collect (line 122) | def collect(self, step): method insert (line 162) | def insert(self, data): method log_train (line 195) | def log_train(self, train_infos, total_num_steps): method eval (line 208) | def eval(self, total_num_steps): FILE: MAPPO-Lagrangian/mappo_lagrangian/scripts/eval/eval_hanabi.py function make_train_env (line 18) | def make_train_env(all_args): function make_eval_env (line 38) | def make_eval_env(all_args): function parse_args (line 59) | def parse_args(args, parser): function main (line 70) | def main(args): FILE: MAPPO-Lagrangian/mappo_lagrangian/scripts/train/train_mujoco.py function make_train_env (line 23) | def make_train_env(all_args): function make_eval_env (line 46) | def make_eval_env(all_args): function parse_args (line 69) | def parse_args(args, parser): function main (line 92) | def main(args): FILE: MAPPO-Lagrangian/mappo_lagrangian/utils/multi_discrete.py class MultiDiscrete (line 6) | class MultiDiscrete(gym.Space): method __init__ (line 22) | def __init__(self, array_of_param_array): method sample (line 28) | def sample(self): method contains (line 34) | def contains(self, x): method shape (line 38) | def shape(self): method __repr__ (line 41) | def __repr__(self): method __eq__ (line 44) | def __eq__(self, other): FILE: MAPPO-Lagrangian/mappo_lagrangian/utils/popart.py class PopArt (line 8) | class PopArt(nn.Module): method __init__ (line 11) | def __init__(self, input_shape, norm_axes=1, beta=0.99999, per_element... method reset_parameters (line 25) | def reset_parameters(self): method running_mean_var (line 30) | def running_mean_var(self): method forward (line 36) | def forward(self, input_vector, train=True): method denormalize (line 64) | def denormalize(self, input_vector): FILE: MAPPO-Lagrangian/mappo_lagrangian/utils/separated_buffer.py function _flatten (line 8) | def _flatten(T, N, x): function _cast (line 12) | def _cast(x): class SeparatedReplayBuffer (line 16) | class SeparatedReplayBuffer(object): method __init__ (line 17) | def __init__(self, args, obs_space, share_obs_space, act_space): method update_factor (line 74) | def update_factor(self, factor): method return_aver_insert (line 77) | def return_aver_insert(self, aver_episode_costs): method insert (line 80) | def insert(self, share_obs, obs, rnn_states, rnn_states_critic, action... method chooseinsert (line 107) | def chooseinsert(self, share_obs, obs, rnn_states, rnn_states_critic, ... method after_update (line 127) | def after_update(self): method chooseafter_update (line 139) | def chooseafter_update(self): method compute_returns (line 145) | def compute_returns(self, next_value, value_normalizer=None): method compute_cost_returns (line 192) | def compute_cost_returns(self, next_cost, value_normalizer=None): method feed_forward_generator (line 236) | def feed_forward_generator(self, advantages, num_mini_batch=None, mini... method naive_recurrent_generator (line 313) | def naive_recurrent_generator(self, advantages, num_mini_batch, cost_a... FILE: MAPPO-Lagrangian/mappo_lagrangian/utils/shared_buffer.py function _flatten (line 6) | def _flatten(T, N, x): function _cast (line 10) | def _cast(x): class SharedReplayBuffer (line 14) | class SharedReplayBuffer(object): method __init__ (line 24) | def __init__(self, args, num_agents, obs_space, cent_obs_space, act_sp... method insert (line 80) | def insert(self, share_obs, obs, rnn_states_actor, rnn_states_critic, ... method chooseinsert (line 115) | def chooseinsert(self, share_obs, obs, rnn_states, rnn_states_critic, ... method after_update (line 150) | def after_update(self): method chooseafter_update (line 162) | def chooseafter_update(self): method compute_returns (line 169) | def compute_returns(self, next_value, value_normalizer=None): method feed_forward_generator (line 195) | def feed_forward_generator(self, advantages, num_mini_batch=None, mini... method naive_recurrent_generator (line 257) | def naive_recurrent_generator(self, advantages, num_mini_batch): method recurrent_generator (line 354) | def recurrent_generator(self, advantages, num_mini_batch, data_chunk_l... FILE: MAPPO-Lagrangian/mappo_lagrangian/utils/util.py function check (line 5) | def check(input): function get_gard_norm (line 9) | def get_gard_norm(it): function update_linear_schedule (line 17) | def update_linear_schedule(optimizer, epoch, total_num_epochs, initial_lr): function huber_loss (line 23) | def huber_loss(e, d): function mse_loss (line 28) | def mse_loss(e): function get_shape_from_obs_space (line 31) | def get_shape_from_obs_space(obs_space): function get_shape_from_act_space (line 40) | def get_shape_from_act_space(act_space): function tile_images (line 54) | def tile_images(img_nhwc): FILE: MAPPO-Lagrangian/setup.py function get_version (line 8) | def get_version() -> str: