SYMBOL INDEX (311 symbols across 17 files) FILE: gym_vec_api/ppo_multidiscrete.py function parse_args (line 17) | def parse_args(): function make_env (line 81) | def make_env(gym_id, seed, idx, capture_video, run_name): function layer_init (line 96) | def layer_init(layer, std=np.sqrt(2), bias_const=0.0): class Transpose (line 102) | class Transpose(nn.Module): method __init__ (line 103) | def __init__(self, permutation): method forward (line 107) | def forward(self, x): class Agent (line 111) | class Agent(nn.Module): method __init__ (line 112) | def __init__(self, envs): method get_value (line 128) | def get_value(self, x): method get_action_and_value (line 131) | def get_action_and_value(self, x, action=None): FILE: gym_vec_api/ppo_multidiscrete_mask.py function parse_args (line 17) | def parse_args(): function make_env (line 81) | def make_env(gym_id, seed, idx, capture_video, run_name): function layer_init (line 96) | def layer_init(layer, std=np.sqrt(2), bias_const=0.0): class Transpose (line 102) | class Transpose(nn.Module): method __init__ (line 103) | def __init__(self, permutation): method forward (line 107) | def forward(self, x): class CategoricalMasked (line 111) | class CategoricalMasked(Categorical): method __init__ (line 112) | def __init__(self, probs=None, logits=None, validate_args=None, masks=... method entropy (line 121) | def entropy(self): class Agent (line 129) | class Agent(nn.Module): method __init__ (line 130) | def __init__(self, envs): method get_value (line 146) | def get_value(self, x): method get_action_and_value (line 149) | def get_action_and_value(self, x, action_mask, action=None): FILE: invalid_action_masking/ppo_10x10.py class RunningMeanStd (line 21) | class RunningMeanStd(object): method __init__ (line 22) | def __init__(self, epsilon=1e-4, shape=()): method update (line 27) | def update(self, x): method update_from_moments (line 33) | def update_from_moments(self, batch_mean, batch_var, batch_count): function update_mean_var_count_from_moments (line 37) | def update_mean_var_count_from_moments(mean, var, count, batch_mean, bat... class NormalizedEnv (line 49) | class NormalizedEnv(gym.core.Wrapper): method __init__ (line 50) | def __init__(self, env, ob=True, ret=True, clipob=10., cliprew=10., ga... method step (line 60) | def step(self, action): method _obfilt (line 73) | def _obfilt(self, obs): method reset (line 81) | def reset(self): class CategoricalMasked (line 201) | class CategoricalMasked(Categorical): method __init__ (line 202) | def __init__(self, probs=None, logits=None, validate_args=None, masks=... method entropy (line 211) | def entropy(self): class Policy (line 218) | class Policy(nn.Module): method __init__ (line 219) | def __init__(self): method forward (line 234) | def forward(self, x): method get_action (line 241) | def get_action(self, x, action=None, invalid_action_masks=None): class Value (line 256) | class Value(nn.Module): method __init__ (line 257) | def __init__(self): method forward (line 272) | def forward(self, x): function discount_cumsum (line 279) | def discount_cumsum(x, dones, gamma): function evaluate_with_no_mask (line 317) | def evaluate_with_no_mask(): FILE: invalid_action_masking/ppo_16x16.py class RunningMeanStd (line 21) | class RunningMeanStd(object): method __init__ (line 22) | def __init__(self, epsilon=1e-4, shape=()): method update (line 27) | def update(self, x): method update_from_moments (line 33) | def update_from_moments(self, batch_mean, batch_var, batch_count): function update_mean_var_count_from_moments (line 37) | def update_mean_var_count_from_moments(mean, var, count, batch_mean, bat... class NormalizedEnv (line 49) | class NormalizedEnv(gym.core.Wrapper): method __init__ (line 50) | def __init__(self, env, ob=True, ret=True, clipob=10., cliprew=10., ga... method step (line 60) | def step(self, action): method _obfilt (line 73) | def _obfilt(self, obs): method reset (line 81) | def reset(self): class CategoricalMasked (line 201) | class CategoricalMasked(Categorical): method __init__ (line 202) | def __init__(self, probs=None, logits=None, validate_args=None, masks=... method entropy (line 211) | def entropy(self): class Policy (line 218) | class Policy(nn.Module): method __init__ (line 219) | def __init__(self): method forward (line 234) | def forward(self, x): method get_action (line 241) | def get_action(self, x, action=None, invalid_action_masks=None): class Value (line 256) | class Value(nn.Module): method __init__ (line 257) | def __init__(self): method forward (line 272) | def forward(self, x): function discount_cumsum (line 279) | def discount_cumsum(x, dones, gamma): function evaluate_with_no_mask (line 317) | def evaluate_with_no_mask(): FILE: invalid_action_masking/ppo_24x24.py class RunningMeanStd (line 21) | class RunningMeanStd(object): method __init__ (line 22) | def __init__(self, epsilon=1e-4, shape=()): method update (line 27) | def update(self, x): method update_from_moments (line 33) | def update_from_moments(self, batch_mean, batch_var, batch_count): function update_mean_var_count_from_moments (line 37) | def update_mean_var_count_from_moments(mean, var, count, batch_mean, bat... class NormalizedEnv (line 49) | class NormalizedEnv(gym.core.Wrapper): method __init__ (line 50) | def __init__(self, env, ob=True, ret=True, clipob=10., cliprew=10., ga... method step (line 60) | def step(self, action): method _obfilt (line 73) | def _obfilt(self, obs): method reset (line 81) | def reset(self): class CategoricalMasked (line 201) | class CategoricalMasked(Categorical): method __init__ (line 202) | def __init__(self, probs=None, logits=None, validate_args=None, masks=... method entropy (line 211) | def entropy(self): class Policy (line 218) | class Policy(nn.Module): method __init__ (line 219) | def __init__(self): method forward (line 234) | def forward(self, x): method get_action (line 241) | def get_action(self, x, action=None, invalid_action_masks=None): class Value (line 256) | class Value(nn.Module): method __init__ (line 257) | def __init__(self): method forward (line 272) | def forward(self, x): function discount_cumsum (line 279) | def discount_cumsum(x, dones, gamma): function evaluate_with_no_mask (line 317) | def evaluate_with_no_mask(): FILE: invalid_action_masking/ppo_4x4.py class RunningMeanStd (line 21) | class RunningMeanStd(object): method __init__ (line 22) | def __init__(self, epsilon=1e-4, shape=()): method update (line 27) | def update(self, x): method update_from_moments (line 33) | def update_from_moments(self, batch_mean, batch_var, batch_count): function update_mean_var_count_from_moments (line 37) | def update_mean_var_count_from_moments(mean, var, count, batch_mean, bat... class NormalizedEnv (line 49) | class NormalizedEnv(gym.core.Wrapper): method __init__ (line 50) | def __init__(self, env, ob=True, ret=True, clipob=10., cliprew=10., ga... method step (line 60) | def step(self, action): method _obfilt (line 73) | def _obfilt(self, obs): method reset (line 81) | def reset(self): class CategoricalMasked (line 201) | class CategoricalMasked(Categorical): method __init__ (line 202) | def __init__(self, probs=None, logits=None, validate_args=None, masks=... method entropy (line 211) | def entropy(self): class Policy (line 218) | class Policy(nn.Module): method __init__ (line 219) | def __init__(self): method forward (line 230) | def forward(self, x): method get_action (line 237) | def get_action(self, x, action=None, invalid_action_masks=None): class Value (line 252) | class Value(nn.Module): method __init__ (line 253) | def __init__(self): method forward (line 265) | def forward(self, x): function discount_cumsum (line 272) | def discount_cumsum(x, dones, gamma): function evaluate_with_no_mask (line 310) | def evaluate_with_no_mask(): FILE: invalid_action_masking/ppo_no_adj_10x10.py class RunningMeanStd (line 21) | class RunningMeanStd(object): method __init__ (line 22) | def __init__(self, epsilon=1e-4, shape=()): method update (line 27) | def update(self, x): method update_from_moments (line 33) | def update_from_moments(self, batch_mean, batch_var, batch_count): function update_mean_var_count_from_moments (line 37) | def update_mean_var_count_from_moments(mean, var, count, batch_mean, bat... class NormalizedEnv (line 49) | class NormalizedEnv(gym.core.Wrapper): method __init__ (line 50) | def __init__(self, env, ob=True, ret=True, clipob=10., cliprew=10., ga... method step (line 60) | def step(self, action): method _obfilt (line 73) | def _obfilt(self, obs): method reset (line 81) | def reset(self): class CategoricalMasked (line 201) | class CategoricalMasked(Categorical): method __init__ (line 202) | def __init__(self, probs=None, logits=None, validate_args=None, masks=... method entropy (line 211) | def entropy(self): class Policy (line 218) | class Policy(nn.Module): method __init__ (line 219) | def __init__(self): method forward (line 234) | def forward(self, x): method get_action (line 241) | def get_action(self, x, action=None, invalid_action_masks=None): class Value (line 256) | class Value(nn.Module): method __init__ (line 257) | def __init__(self): method forward (line 272) | def forward(self, x): function discount_cumsum (line 279) | def discount_cumsum(x, dones, gamma): FILE: invalid_action_masking/ppo_no_adj_16x16.py class RunningMeanStd (line 21) | class RunningMeanStd(object): method __init__ (line 22) | def __init__(self, epsilon=1e-4, shape=()): method update (line 27) | def update(self, x): method update_from_moments (line 33) | def update_from_moments(self, batch_mean, batch_var, batch_count): function update_mean_var_count_from_moments (line 37) | def update_mean_var_count_from_moments(mean, var, count, batch_mean, bat... class NormalizedEnv (line 49) | class NormalizedEnv(gym.core.Wrapper): method __init__ (line 50) | def __init__(self, env, ob=True, ret=True, clipob=10., cliprew=10., ga... method step (line 60) | def step(self, action): method _obfilt (line 73) | def _obfilt(self, obs): method reset (line 81) | def reset(self): class CategoricalMasked (line 201) | class CategoricalMasked(Categorical): method __init__ (line 202) | def __init__(self, probs=None, logits=None, validate_args=None, masks=... method entropy (line 211) | def entropy(self): class Policy (line 218) | class Policy(nn.Module): method __init__ (line 219) | def __init__(self): method forward (line 234) | def forward(self, x): method get_action (line 241) | def get_action(self, x, action=None, invalid_action_masks=None): class Value (line 256) | class Value(nn.Module): method __init__ (line 257) | def __init__(self): method forward (line 272) | def forward(self, x): function discount_cumsum (line 279) | def discount_cumsum(x, dones, gamma): FILE: invalid_action_masking/ppo_no_adj_24x24.py class RunningMeanStd (line 21) | class RunningMeanStd(object): method __init__ (line 22) | def __init__(self, epsilon=1e-4, shape=()): method update (line 27) | def update(self, x): method update_from_moments (line 33) | def update_from_moments(self, batch_mean, batch_var, batch_count): function update_mean_var_count_from_moments (line 37) | def update_mean_var_count_from_moments(mean, var, count, batch_mean, bat... class NormalizedEnv (line 49) | class NormalizedEnv(gym.core.Wrapper): method __init__ (line 50) | def __init__(self, env, ob=True, ret=True, clipob=10., cliprew=10., ga... method step (line 60) | def step(self, action): method _obfilt (line 73) | def _obfilt(self, obs): method reset (line 81) | def reset(self): class CategoricalMasked (line 201) | class CategoricalMasked(Categorical): method __init__ (line 202) | def __init__(self, probs=None, logits=None, validate_args=None, masks=... method entropy (line 211) | def entropy(self): class Policy (line 218) | class Policy(nn.Module): method __init__ (line 219) | def __init__(self): method forward (line 234) | def forward(self, x): method get_action (line 241) | def get_action(self, x, action=None, invalid_action_masks=None): class Value (line 256) | class Value(nn.Module): method __init__ (line 257) | def __init__(self): method forward (line 272) | def forward(self, x): function discount_cumsum (line 279) | def discount_cumsum(x, dones, gamma): FILE: invalid_action_masking/ppo_no_adj_4x4.py class RunningMeanStd (line 21) | class RunningMeanStd(object): method __init__ (line 22) | def __init__(self, epsilon=1e-4, shape=()): method update (line 27) | def update(self, x): method update_from_moments (line 33) | def update_from_moments(self, batch_mean, batch_var, batch_count): function update_mean_var_count_from_moments (line 37) | def update_mean_var_count_from_moments(mean, var, count, batch_mean, bat... class NormalizedEnv (line 49) | class NormalizedEnv(gym.core.Wrapper): method __init__ (line 50) | def __init__(self, env, ob=True, ret=True, clipob=10., cliprew=10., ga... method step (line 60) | def step(self, action): method _obfilt (line 73) | def _obfilt(self, obs): method reset (line 81) | def reset(self): class CategoricalMasked (line 201) | class CategoricalMasked(Categorical): method __init__ (line 202) | def __init__(self, probs=None, logits=None, validate_args=None, masks=... method entropy (line 211) | def entropy(self): class Policy (line 218) | class Policy(nn.Module): method __init__ (line 219) | def __init__(self): method forward (line 231) | def forward(self, x): method get_action (line 238) | def get_action(self, x, action=None, invalid_action_masks=None): class Value (line 253) | class Value(nn.Module): method __init__ (line 254) | def __init__(self): method forward (line 266) | def forward(self, x): function discount_cumsum (line 273) | def discount_cumsum(x, dones, gamma): FILE: invalid_action_masking/ppo_no_mask_10x10.py class RunningMeanStd (line 21) | class RunningMeanStd(object): method __init__ (line 22) | def __init__(self, epsilon=1e-4, shape=()): method update (line 27) | def update(self, x): method update_from_moments (line 33) | def update_from_moments(self, batch_mean, batch_var, batch_count): function update_mean_var_count_from_moments (line 37) | def update_mean_var_count_from_moments(mean, var, count, batch_mean, bat... class NormalizedEnv (line 49) | class NormalizedEnv(gym.core.Wrapper): method __init__ (line 50) | def __init__(self, env, ob=True, ret=True, clipob=10., cliprew=10., ga... method step (line 60) | def step(self, action): method _obfilt (line 73) | def _obfilt(self, obs): method reset (line 81) | def reset(self): class CategoricalMasked (line 203) | class CategoricalMasked(Categorical): method __init__ (line 204) | def __init__(self, probs=None, logits=None, validate_args=None, masks=... method entropy (line 213) | def entropy(self): class Policy (line 220) | class Policy(nn.Module): method __init__ (line 221) | def __init__(self): method forward (line 236) | def forward(self, x): method get_action (line 243) | def get_action(self, x, action=None): class Value (line 255) | class Value(nn.Module): method __init__ (line 256) | def __init__(self): method forward (line 271) | def forward(self, x): function discount_cumsum (line 278) | def discount_cumsum(x, dones, gamma): FILE: invalid_action_masking/ppo_no_mask_16x16.py class RunningMeanStd (line 21) | class RunningMeanStd(object): method __init__ (line 22) | def __init__(self, epsilon=1e-4, shape=()): method update (line 27) | def update(self, x): method update_from_moments (line 33) | def update_from_moments(self, batch_mean, batch_var, batch_count): function update_mean_var_count_from_moments (line 37) | def update_mean_var_count_from_moments(mean, var, count, batch_mean, bat... class NormalizedEnv (line 49) | class NormalizedEnv(gym.core.Wrapper): method __init__ (line 50) | def __init__(self, env, ob=True, ret=True, clipob=10., cliprew=10., ga... method step (line 60) | def step(self, action): method _obfilt (line 73) | def _obfilt(self, obs): method reset (line 81) | def reset(self): class CategoricalMasked (line 203) | class CategoricalMasked(Categorical): method __init__ (line 204) | def __init__(self, probs=None, logits=None, validate_args=None, masks=... method entropy (line 213) | def entropy(self): class Policy (line 220) | class Policy(nn.Module): method __init__ (line 221) | def __init__(self): method forward (line 236) | def forward(self, x): method get_action (line 243) | def get_action(self, x, action=None): class Value (line 255) | class Value(nn.Module): method __init__ (line 256) | def __init__(self): method forward (line 271) | def forward(self, x): function discount_cumsum (line 278) | def discount_cumsum(x, dones, gamma): FILE: invalid_action_masking/ppo_no_mask_24x24.py class RunningMeanStd (line 21) | class RunningMeanStd(object): method __init__ (line 22) | def __init__(self, epsilon=1e-4, shape=()): method update (line 27) | def update(self, x): method update_from_moments (line 33) | def update_from_moments(self, batch_mean, batch_var, batch_count): function update_mean_var_count_from_moments (line 37) | def update_mean_var_count_from_moments(mean, var, count, batch_mean, bat... class NormalizedEnv (line 49) | class NormalizedEnv(gym.core.Wrapper): method __init__ (line 50) | def __init__(self, env, ob=True, ret=True, clipob=10., cliprew=10., ga... method step (line 60) | def step(self, action): method _obfilt (line 73) | def _obfilt(self, obs): method reset (line 81) | def reset(self): class CategoricalMasked (line 203) | class CategoricalMasked(Categorical): method __init__ (line 204) | def __init__(self, probs=None, logits=None, validate_args=None, masks=... method entropy (line 213) | def entropy(self): class Policy (line 220) | class Policy(nn.Module): method __init__ (line 221) | def __init__(self): method forward (line 236) | def forward(self, x): method get_action (line 243) | def get_action(self, x, action=None): class Value (line 255) | class Value(nn.Module): method __init__ (line 256) | def __init__(self): method forward (line 271) | def forward(self, x): function discount_cumsum (line 278) | def discount_cumsum(x, dones, gamma): FILE: invalid_action_masking/ppo_no_mask_4x4.py class RunningMeanStd (line 21) | class RunningMeanStd(object): method __init__ (line 22) | def __init__(self, epsilon=1e-4, shape=()): method update (line 27) | def update(self, x): method update_from_moments (line 33) | def update_from_moments(self, batch_mean, batch_var, batch_count): function update_mean_var_count_from_moments (line 37) | def update_mean_var_count_from_moments(mean, var, count, batch_mean, bat... class NormalizedEnv (line 49) | class NormalizedEnv(gym.core.Wrapper): method __init__ (line 50) | def __init__(self, env, ob=True, ret=True, clipob=10., cliprew=10., ga... method step (line 60) | def step(self, action): method _obfilt (line 73) | def _obfilt(self, obs): method reset (line 81) | def reset(self): class CategoricalMasked (line 203) | class CategoricalMasked(Categorical): method __init__ (line 204) | def __init__(self, probs=None, logits=None, validate_args=None, masks=... method entropy (line 213) | def entropy(self): class Policy (line 220) | class Policy(nn.Module): method __init__ (line 221) | def __init__(self): method forward (line 233) | def forward(self, x): method get_action (line 240) | def get_action(self, x, action=None): class Value (line 252) | class Value(nn.Module): method __init__ (line 253) | def __init__(self): method forward (line 265) | def forward(self, x): function discount_cumsum (line 272) | def discount_cumsum(x, dones, gamma): FILE: plots/approx_kl.py function smooth (line 140) | def smooth(scalars, weight): # Weight between 0 and 1 function get_df_for_env (line 158) | def get_df_for_env(gym_id): function export_legend (line 180) | def export_legend(ax, filename="legend.pdf"): function _smooth (line 237) | def _smooth(df): FILE: plots/episode_reward.py function smooth (line 156) | def smooth(scalars, weight): # Weight between 0 and 1 function get_df_for_env (line 174) | def get_df_for_env(gym_id): function export_legend (line 196) | def export_legend(ax, filename="legend.pdf"): function _smooth (line 253) | def _smooth(df): FILE: ppo.py class ImageToPyTorch (line 90) | class ImageToPyTorch(gym.ObservationWrapper): method __init__ (line 91) | def __init__(self, env): method observation (line 101) | def observation(self, observation): class VecPyTorch (line 104) | class VecPyTorch(VecEnvWrapper): method __init__ (line 105) | def __init__(self, venv, device): method reset (line 109) | def reset(self): method step_async (line 114) | def step_async(self, actions): method step_wait (line 118) | def step_wait(self): class MicroRTSStatsRecorder (line 124) | class MicroRTSStatsRecorder(gym.Wrapper): method reset (line 126) | def reset(self, **kwargs): method step (line 131) | def step(self, action): function make_env (line 158) | def make_env(gym_id, seed, idx): class CategoricalMasked (line 181) | class CategoricalMasked(Categorical): method __init__ (line 182) | def __init__(self, probs=None, logits=None, validate_args=None, masks=... method entropy (line 191) | def entropy(self): class Scale (line 198) | class Scale(nn.Module): method __init__ (line 199) | def __init__(self, scale): method forward (line 203) | def forward(self, x): function layer_init (line 206) | def layer_init(layer, std=np.sqrt(2), bias_const=0.0): class Agent (line 211) | class Agent(nn.Module): method __init__ (line 212) | def __init__(self, frames=4): method forward (line 225) | def forward(self, x): method get_action (line 228) | def get_action(self, x, action=None, invalid_action_masks=None): method get_value (line 244) | def get_value(self, x):