SYMBOL INDEX (311 symbols across 17 files)

FILE: gym_vec_api/ppo_multidiscrete.py
  function parse_args (line 17) | def parse_args():
  function make_env (line 81) | def make_env(gym_id, seed, idx, capture_video, run_name):
  function layer_init (line 96) | def layer_init(layer, std=np.sqrt(2), bias_const=0.0):
  class Transpose (line 102) | class Transpose(nn.Module):
    method __init__ (line 103) | def __init__(self, permutation):
    method forward (line 107) | def forward(self, x):
  class Agent (line 111) | class Agent(nn.Module):
    method __init__ (line 112) | def __init__(self, envs):
    method get_value (line 128) | def get_value(self, x):
    method get_action_and_value (line 131) | def get_action_and_value(self, x, action=None):

FILE: gym_vec_api/ppo_multidiscrete_mask.py
  function parse_args (line 17) | def parse_args():
  function make_env (line 81) | def make_env(gym_id, seed, idx, capture_video, run_name):
  function layer_init (line 96) | def layer_init(layer, std=np.sqrt(2), bias_const=0.0):
  class Transpose (line 102) | class Transpose(nn.Module):
    method __init__ (line 103) | def __init__(self, permutation):
    method forward (line 107) | def forward(self, x):
  class CategoricalMasked (line 111) | class CategoricalMasked(Categorical):
    method __init__ (line 112) | def __init__(self, probs=None, logits=None, validate_args=None, masks=...
    method entropy (line 121) | def entropy(self):
  class Agent (line 129) | class Agent(nn.Module):
    method __init__ (line 130) | def __init__(self, envs):
    method get_value (line 146) | def get_value(self, x):
    method get_action_and_value (line 149) | def get_action_and_value(self, x, action_mask, action=None):

FILE: invalid_action_masking/ppo_10x10.py
  class RunningMeanStd (line 21) | class RunningMeanStd(object):
    method __init__ (line 22) | def __init__(self, epsilon=1e-4, shape=()):
    method update (line 27) | def update(self, x):
    method update_from_moments (line 33) | def update_from_moments(self, batch_mean, batch_var, batch_count):
  function update_mean_var_count_from_moments (line 37) | def update_mean_var_count_from_moments(mean, var, count, batch_mean, bat...
  class NormalizedEnv (line 49) | class NormalizedEnv(gym.core.Wrapper):
    method __init__ (line 50) | def __init__(self, env, ob=True, ret=True, clipob=10., cliprew=10., ga...
    method step (line 60) | def step(self, action):
    method _obfilt (line 73) | def _obfilt(self, obs):
    method reset (line 81) | def reset(self):
  class CategoricalMasked (line 201) | class CategoricalMasked(Categorical):
    method __init__ (line 202) | def __init__(self, probs=None, logits=None, validate_args=None, masks=...
    method entropy (line 211) | def entropy(self):
  class Policy (line 218) | class Policy(nn.Module):
    method __init__ (line 219) | def __init__(self):
    method forward (line 234) | def forward(self, x):
    method get_action (line 241) | def get_action(self, x, action=None, invalid_action_masks=None):
  class Value (line 256) | class Value(nn.Module):
    method __init__ (line 257) | def __init__(self):
    method forward (line 272) | def forward(self, x):
  function discount_cumsum (line 279) | def discount_cumsum(x, dones, gamma):
  function evaluate_with_no_mask (line 317) | def evaluate_with_no_mask():

FILE: invalid_action_masking/ppo_16x16.py
  class RunningMeanStd (line 21) | class RunningMeanStd(object):
    method __init__ (line 22) | def __init__(self, epsilon=1e-4, shape=()):
    method update (line 27) | def update(self, x):
    method update_from_moments (line 33) | def update_from_moments(self, batch_mean, batch_var, batch_count):
  function update_mean_var_count_from_moments (line 37) | def update_mean_var_count_from_moments(mean, var, count, batch_mean, bat...
  class NormalizedEnv (line 49) | class NormalizedEnv(gym.core.Wrapper):
    method __init__ (line 50) | def __init__(self, env, ob=True, ret=True, clipob=10., cliprew=10., ga...
    method step (line 60) | def step(self, action):
    method _obfilt (line 73) | def _obfilt(self, obs):
    method reset (line 81) | def reset(self):
  class CategoricalMasked (line 201) | class CategoricalMasked(Categorical):
    method __init__ (line 202) | def __init__(self, probs=None, logits=None, validate_args=None, masks=...
    method entropy (line 211) | def entropy(self):
  class Policy (line 218) | class Policy(nn.Module):
    method __init__ (line 219) | def __init__(self):
    method forward (line 234) | def forward(self, x):
    method get_action (line 241) | def get_action(self, x, action=None, invalid_action_masks=None):
  class Value (line 256) | class Value(nn.Module):
    method __init__ (line 257) | def __init__(self):
    method forward (line 272) | def forward(self, x):
  function discount_cumsum (line 279) | def discount_cumsum(x, dones, gamma):
  function evaluate_with_no_mask (line 317) | def evaluate_with_no_mask():

FILE: invalid_action_masking/ppo_24x24.py
  class RunningMeanStd (line 21) | class RunningMeanStd(object):
    method __init__ (line 22) | def __init__(self, epsilon=1e-4, shape=()):
    method update (line 27) | def update(self, x):
    method update_from_moments (line 33) | def update_from_moments(self, batch_mean, batch_var, batch_count):
  function update_mean_var_count_from_moments (line 37) | def update_mean_var_count_from_moments(mean, var, count, batch_mean, bat...
  class NormalizedEnv (line 49) | class NormalizedEnv(gym.core.Wrapper):
    method __init__ (line 50) | def __init__(self, env, ob=True, ret=True, clipob=10., cliprew=10., ga...
    method step (line 60) | def step(self, action):
    method _obfilt (line 73) | def _obfilt(self, obs):
    method reset (line 81) | def reset(self):
  class CategoricalMasked (line 201) | class CategoricalMasked(Categorical):
    method __init__ (line 202) | def __init__(self, probs=None, logits=None, validate_args=None, masks=...
    method entropy (line 211) | def entropy(self):
  class Policy (line 218) | class Policy(nn.Module):
    method __init__ (line 219) | def __init__(self):
    method forward (line 234) | def forward(self, x):
    method get_action (line 241) | def get_action(self, x, action=None, invalid_action_masks=None):
  class Value (line 256) | class Value(nn.Module):
    method __init__ (line 257) | def __init__(self):
    method forward (line 272) | def forward(self, x):
  function discount_cumsum (line 279) | def discount_cumsum(x, dones, gamma):
  function evaluate_with_no_mask (line 317) | def evaluate_with_no_mask():

FILE: invalid_action_masking/ppo_4x4.py
  class RunningMeanStd (line 21) | class RunningMeanStd(object):
    method __init__ (line 22) | def __init__(self, epsilon=1e-4, shape=()):
    method update (line 27) | def update(self, x):
    method update_from_moments (line 33) | def update_from_moments(self, batch_mean, batch_var, batch_count):
  function update_mean_var_count_from_moments (line 37) | def update_mean_var_count_from_moments(mean, var, count, batch_mean, bat...
  class NormalizedEnv (line 49) | class NormalizedEnv(gym.core.Wrapper):
    method __init__ (line 50) | def __init__(self, env, ob=True, ret=True, clipob=10., cliprew=10., ga...
    method step (line 60) | def step(self, action):
    method _obfilt (line 73) | def _obfilt(self, obs):
    method reset (line 81) | def reset(self):
  class CategoricalMasked (line 201) | class CategoricalMasked(Categorical):
    method __init__ (line 202) | def __init__(self, probs=None, logits=None, validate_args=None, masks=...
    method entropy (line 211) | def entropy(self):
  class Policy (line 218) | class Policy(nn.Module):
    method __init__ (line 219) | def __init__(self):
    method forward (line 230) | def forward(self, x):
    method get_action (line 237) | def get_action(self, x, action=None, invalid_action_masks=None):
  class Value (line 252) | class Value(nn.Module):
    method __init__ (line 253) | def __init__(self):
    method forward (line 265) | def forward(self, x):
  function discount_cumsum (line 272) | def discount_cumsum(x, dones, gamma):
  function evaluate_with_no_mask (line 310) | def evaluate_with_no_mask():

FILE: invalid_action_masking/ppo_no_adj_10x10.py
  class RunningMeanStd (line 21) | class RunningMeanStd(object):
    method __init__ (line 22) | def __init__(self, epsilon=1e-4, shape=()):
    method update (line 27) | def update(self, x):
    method update_from_moments (line 33) | def update_from_moments(self, batch_mean, batch_var, batch_count):
  function update_mean_var_count_from_moments (line 37) | def update_mean_var_count_from_moments(mean, var, count, batch_mean, bat...
  class NormalizedEnv (line 49) | class NormalizedEnv(gym.core.Wrapper):
    method __init__ (line 50) | def __init__(self, env, ob=True, ret=True, clipob=10., cliprew=10., ga...
    method step (line 60) | def step(self, action):
    method _obfilt (line 73) | def _obfilt(self, obs):
    method reset (line 81) | def reset(self):
  class CategoricalMasked (line 201) | class CategoricalMasked(Categorical):
    method __init__ (line 202) | def __init__(self, probs=None, logits=None, validate_args=None, masks=...
    method entropy (line 211) | def entropy(self):
  class Policy (line 218) | class Policy(nn.Module):
    method __init__ (line 219) | def __init__(self):
    method forward (line 234) | def forward(self, x):
    method get_action (line 241) | def get_action(self, x, action=None, invalid_action_masks=None):
  class Value (line 256) | class Value(nn.Module):
    method __init__ (line 257) | def __init__(self):
    method forward (line 272) | def forward(self, x):
  function discount_cumsum (line 279) | def discount_cumsum(x, dones, gamma):

FILE: invalid_action_masking/ppo_no_adj_16x16.py
  class RunningMeanStd (line 21) | class RunningMeanStd(object):
    method __init__ (line 22) | def __init__(self, epsilon=1e-4, shape=()):
    method update (line 27) | def update(self, x):
    method update_from_moments (line 33) | def update_from_moments(self, batch_mean, batch_var, batch_count):
  function update_mean_var_count_from_moments (line 37) | def update_mean_var_count_from_moments(mean, var, count, batch_mean, bat...
  class NormalizedEnv (line 49) | class NormalizedEnv(gym.core.Wrapper):
    method __init__ (line 50) | def __init__(self, env, ob=True, ret=True, clipob=10., cliprew=10., ga...
    method step (line 60) | def step(self, action):
    method _obfilt (line 73) | def _obfilt(self, obs):
    method reset (line 81) | def reset(self):
  class CategoricalMasked (line 201) | class CategoricalMasked(Categorical):
    method __init__ (line 202) | def __init__(self, probs=None, logits=None, validate_args=None, masks=...
    method entropy (line 211) | def entropy(self):
  class Policy (line 218) | class Policy(nn.Module):
    method __init__ (line 219) | def __init__(self):
    method forward (line 234) | def forward(self, x):
    method get_action (line 241) | def get_action(self, x, action=None, invalid_action_masks=None):
  class Value (line 256) | class Value(nn.Module):
    method __init__ (line 257) | def __init__(self):
    method forward (line 272) | def forward(self, x):
  function discount_cumsum (line 279) | def discount_cumsum(x, dones, gamma):

FILE: invalid_action_masking/ppo_no_adj_24x24.py
  class RunningMeanStd (line 21) | class RunningMeanStd(object):
    method __init__ (line 22) | def __init__(self, epsilon=1e-4, shape=()):
    method update (line 27) | def update(self, x):
    method update_from_moments (line 33) | def update_from_moments(self, batch_mean, batch_var, batch_count):
  function update_mean_var_count_from_moments (line 37) | def update_mean_var_count_from_moments(mean, var, count, batch_mean, bat...
  class NormalizedEnv (line 49) | class NormalizedEnv(gym.core.Wrapper):
    method __init__ (line 50) | def __init__(self, env, ob=True, ret=True, clipob=10., cliprew=10., ga...
    method step (line 60) | def step(self, action):
    method _obfilt (line 73) | def _obfilt(self, obs):
    method reset (line 81) | def reset(self):
  class CategoricalMasked (line 201) | class CategoricalMasked(Categorical):
    method __init__ (line 202) | def __init__(self, probs=None, logits=None, validate_args=None, masks=...
    method entropy (line 211) | def entropy(self):
  class Policy (line 218) | class Policy(nn.Module):
    method __init__ (line 219) | def __init__(self):
    method forward (line 234) | def forward(self, x):
    method get_action (line 241) | def get_action(self, x, action=None, invalid_action_masks=None):
  class Value (line 256) | class Value(nn.Module):
    method __init__ (line 257) | def __init__(self):
    method forward (line 272) | def forward(self, x):
  function discount_cumsum (line 279) | def discount_cumsum(x, dones, gamma):

FILE: invalid_action_masking/ppo_no_adj_4x4.py
  class RunningMeanStd (line 21) | class RunningMeanStd(object):
    method __init__ (line 22) | def __init__(self, epsilon=1e-4, shape=()):
    method update (line 27) | def update(self, x):
    method update_from_moments (line 33) | def update_from_moments(self, batch_mean, batch_var, batch_count):
  function update_mean_var_count_from_moments (line 37) | def update_mean_var_count_from_moments(mean, var, count, batch_mean, bat...
  class NormalizedEnv (line 49) | class NormalizedEnv(gym.core.Wrapper):
    method __init__ (line 50) | def __init__(self, env, ob=True, ret=True, clipob=10., cliprew=10., ga...
    method step (line 60) | def step(self, action):
    method _obfilt (line 73) | def _obfilt(self, obs):
    method reset (line 81) | def reset(self):
  class CategoricalMasked (line 201) | class CategoricalMasked(Categorical):
    method __init__ (line 202) | def __init__(self, probs=None, logits=None, validate_args=None, masks=...
    method entropy (line 211) | def entropy(self):
  class Policy (line 218) | class Policy(nn.Module):
    method __init__ (line 219) | def __init__(self):
    method forward (line 231) | def forward(self, x):
    method get_action (line 238) | def get_action(self, x, action=None, invalid_action_masks=None):
  class Value (line 253) | class Value(nn.Module):
    method __init__ (line 254) | def __init__(self):
    method forward (line 266) | def forward(self, x):
  function discount_cumsum (line 273) | def discount_cumsum(x, dones, gamma):

FILE: invalid_action_masking/ppo_no_mask_10x10.py
  class RunningMeanStd (line 21) | class RunningMeanStd(object):
    method __init__ (line 22) | def __init__(self, epsilon=1e-4, shape=()):
    method update (line 27) | def update(self, x):
    method update_from_moments (line 33) | def update_from_moments(self, batch_mean, batch_var, batch_count):
  function update_mean_var_count_from_moments (line 37) | def update_mean_var_count_from_moments(mean, var, count, batch_mean, bat...
  class NormalizedEnv (line 49) | class NormalizedEnv(gym.core.Wrapper):
    method __init__ (line 50) | def __init__(self, env, ob=True, ret=True, clipob=10., cliprew=10., ga...
    method step (line 60) | def step(self, action):
    method _obfilt (line 73) | def _obfilt(self, obs):
    method reset (line 81) | def reset(self):
  class CategoricalMasked (line 203) | class CategoricalMasked(Categorical):
    method __init__ (line 204) | def __init__(self, probs=None, logits=None, validate_args=None, masks=...
    method entropy (line 213) | def entropy(self):
  class Policy (line 220) | class Policy(nn.Module):
    method __init__ (line 221) | def __init__(self):
    method forward (line 236) | def forward(self, x):
    method get_action (line 243) | def get_action(self, x, action=None):
  class Value (line 255) | class Value(nn.Module):
    method __init__ (line 256) | def __init__(self):
    method forward (line 271) | def forward(self, x):
  function discount_cumsum (line 278) | def discount_cumsum(x, dones, gamma):

FILE: invalid_action_masking/ppo_no_mask_16x16.py
  class RunningMeanStd (line 21) | class RunningMeanStd(object):
    method __init__ (line 22) | def __init__(self, epsilon=1e-4, shape=()):
    method update (line 27) | def update(self, x):
    method update_from_moments (line 33) | def update_from_moments(self, batch_mean, batch_var, batch_count):
  function update_mean_var_count_from_moments (line 37) | def update_mean_var_count_from_moments(mean, var, count, batch_mean, bat...
  class NormalizedEnv (line 49) | class NormalizedEnv(gym.core.Wrapper):
    method __init__ (line 50) | def __init__(self, env, ob=True, ret=True, clipob=10., cliprew=10., ga...
    method step (line 60) | def step(self, action):
    method _obfilt (line 73) | def _obfilt(self, obs):
    method reset (line 81) | def reset(self):
  class CategoricalMasked (line 203) | class CategoricalMasked(Categorical):
    method __init__ (line 204) | def __init__(self, probs=None, logits=None, validate_args=None, masks=...
    method entropy (line 213) | def entropy(self):
  class Policy (line 220) | class Policy(nn.Module):
    method __init__ (line 221) | def __init__(self):
    method forward (line 236) | def forward(self, x):
    method get_action (line 243) | def get_action(self, x, action=None):
  class Value (line 255) | class Value(nn.Module):
    method __init__ (line 256) | def __init__(self):
    method forward (line 271) | def forward(self, x):
  function discount_cumsum (line 278) | def discount_cumsum(x, dones, gamma):

FILE: invalid_action_masking/ppo_no_mask_24x24.py
  class RunningMeanStd (line 21) | class RunningMeanStd(object):
    method __init__ (line 22) | def __init__(self, epsilon=1e-4, shape=()):
    method update (line 27) | def update(self, x):
    method update_from_moments (line 33) | def update_from_moments(self, batch_mean, batch_var, batch_count):
  function update_mean_var_count_from_moments (line 37) | def update_mean_var_count_from_moments(mean, var, count, batch_mean, bat...
  class NormalizedEnv (line 49) | class NormalizedEnv(gym.core.Wrapper):
    method __init__ (line 50) | def __init__(self, env, ob=True, ret=True, clipob=10., cliprew=10., ga...
    method step (line 60) | def step(self, action):
    method _obfilt (line 73) | def _obfilt(self, obs):
    method reset (line 81) | def reset(self):
  class CategoricalMasked (line 203) | class CategoricalMasked(Categorical):
    method __init__ (line 204) | def __init__(self, probs=None, logits=None, validate_args=None, masks=...
    method entropy (line 213) | def entropy(self):
  class Policy (line 220) | class Policy(nn.Module):
    method __init__ (line 221) | def __init__(self):
    method forward (line 236) | def forward(self, x):
    method get_action (line 243) | def get_action(self, x, action=None):
  class Value (line 255) | class Value(nn.Module):
    method __init__ (line 256) | def __init__(self):
    method forward (line 271) | def forward(self, x):
  function discount_cumsum (line 278) | def discount_cumsum(x, dones, gamma):

FILE: invalid_action_masking/ppo_no_mask_4x4.py
  class RunningMeanStd (line 21) | class RunningMeanStd(object):
    method __init__ (line 22) | def __init__(self, epsilon=1e-4, shape=()):
    method update (line 27) | def update(self, x):
    method update_from_moments (line 33) | def update_from_moments(self, batch_mean, batch_var, batch_count):
  function update_mean_var_count_from_moments (line 37) | def update_mean_var_count_from_moments(mean, var, count, batch_mean, bat...
  class NormalizedEnv (line 49) | class NormalizedEnv(gym.core.Wrapper):
    method __init__ (line 50) | def __init__(self, env, ob=True, ret=True, clipob=10., cliprew=10., ga...
    method step (line 60) | def step(self, action):
    method _obfilt (line 73) | def _obfilt(self, obs):
    method reset (line 81) | def reset(self):
  class CategoricalMasked (line 203) | class CategoricalMasked(Categorical):
    method __init__ (line 204) | def __init__(self, probs=None, logits=None, validate_args=None, masks=...
    method entropy (line 213) | def entropy(self):
  class Policy (line 220) | class Policy(nn.Module):
    method __init__ (line 221) | def __init__(self):
    method forward (line 233) | def forward(self, x):
    method get_action (line 240) | def get_action(self, x, action=None):
  class Value (line 252) | class Value(nn.Module):
    method __init__ (line 253) | def __init__(self):
    method forward (line 265) | def forward(self, x):
  function discount_cumsum (line 272) | def discount_cumsum(x, dones, gamma):

FILE: plots/approx_kl.py
  function smooth (line 140) | def smooth(scalars, weight):  # Weight between 0 and 1
  function get_df_for_env (line 158) | def get_df_for_env(gym_id):
  function export_legend (line 180) | def export_legend(ax, filename="legend.pdf"):
  function _smooth (line 237) | def _smooth(df):

FILE: plots/episode_reward.py
  function smooth (line 156) | def smooth(scalars, weight):  # Weight between 0 and 1
  function get_df_for_env (line 174) | def get_df_for_env(gym_id):
  function export_legend (line 196) | def export_legend(ax, filename="legend.pdf"):
  function _smooth (line 253) | def _smooth(df):

FILE: ppo.py
  class ImageToPyTorch (line 90) | class ImageToPyTorch(gym.ObservationWrapper):
    method __init__ (line 91) | def __init__(self, env):
    method observation (line 101) | def observation(self, observation):
  class VecPyTorch (line 104) | class VecPyTorch(VecEnvWrapper):
    method __init__ (line 105) | def __init__(self, venv, device):
    method reset (line 109) | def reset(self):
    method step_async (line 114) | def step_async(self, actions):
    method step_wait (line 118) | def step_wait(self):
  class MicroRTSStatsRecorder (line 124) | class MicroRTSStatsRecorder(gym.Wrapper):
    method reset (line 126) | def reset(self, **kwargs):
    method step (line 131) | def step(self, action):
  function make_env (line 158) | def make_env(gym_id, seed, idx):
  class CategoricalMasked (line 181) | class CategoricalMasked(Categorical):
    method __init__ (line 182) | def __init__(self, probs=None, logits=None, validate_args=None, masks=...
    method entropy (line 191) | def entropy(self):
  class Scale (line 198) | class Scale(nn.Module):
    method __init__ (line 199) | def __init__(self, scale):
    method forward (line 203) | def forward(self, x):
  function layer_init (line 206) | def layer_init(layer, std=np.sqrt(2), bias_const=0.0):
  class Agent (line 211) | class Agent(nn.Module):
    method __init__ (line 212) | def __init__(self, frames=4):
    method forward (line 225) | def forward(self, x):
    method get_action (line 228) | def get_action(self, x, action=None, invalid_action_masks=None):
    method get_value (line 244) | def get_value(self, x):