SYMBOL INDEX (162 symbols across 11 files)

FILE: fast_td3/environments/humanoid_bench_env.py
  function make_env (line 17) | def make_env(env_name, rank, render_mode=None, seed=0):
  class HumanoidBenchEnv (line 51) | class HumanoidBenchEnv:
    method __init__ (line 54) | def __init__(self, env_name, num_envs=1, render_mode=None, device=None):
    method reset (line 84) | def reset(self):
    method render (line 92) | def render(self):
    method step (line 98) | def step(self, actions):

FILE: fast_td3/environments/isaaclab_env.py
  class IsaacLabEnv (line 7) | class IsaacLabEnv:
    method __init__ (line 10) | def __init__(
    method reset (line 48) | def reset(self, random_start_init: bool = True) -> torch.Tensor:
    method reset_with_critic_obs (line 57) | def reset_with_critic_obs(self) -> tuple[torch.Tensor, torch.Tensor]:
    method step (line 61) | def step(
    method render (line 80) | def render(self):

FILE: fast_td3/environments/mtbench_env.py
  class MTBenchEnv (line 10) | class MTBenchEnv:
    method __init__ (line 11) | def __init__(
    method reset (line 62) | def reset(self) -> torch.Tensor:
    method step (line 72) | def step(
    method render (line 90) | def render(self):

FILE: fast_td3/environments/mujoco_playground_env.py
  class PlaygroundEvalEnvWrapper (line 8) | class PlaygroundEvalEnvWrapper:
    method __init__ (line 9) | def __init__(
    method reset (line 43) | def reset(self):
    method step (line 51) | def step(self, actions):
    method render_trajectory (line 61) | def render_trajectory(self, trajectory):
  function make_env (line 77) | def make_env(

FILE: fast_td3/fast_td3.py
  class DistributionalQNetwork (line 6) | class DistributionalQNetwork(nn.Module):
    method __init__ (line 7) | def __init__(
    method forward (line 31) | def forward(self, obs: torch.Tensor, actions: torch.Tensor) -> torch.T...
    method projection (line 36) | def projection(
  class Critic (line 84) | class Critic(nn.Module):
    method __init__ (line 85) | def __init__(
    method forward (line 120) | def forward(self, obs: torch.Tensor, actions: torch.Tensor) -> torch.T...
    method projection (line 123) | def projection(
    method get_value (line 152) | def get_value(self, probs: torch.Tensor) -> torch.Tensor:
  class Actor (line 157) | class Actor(nn.Module):
    method __init__ (line 158) | def __init__(
    method forward (line 196) | def forward(self, obs: torch.Tensor) -> torch.Tensor:
    method explore (line 202) | def explore(
  class MultiTaskActor (line 228) | class MultiTaskActor(Actor):
    method __init__ (line 229) | def __init__(self, num_tasks: int, task_embedding_dim: int, *args, **k...
    method forward (line 237) | def forward(self, obs: torch.Tensor) -> torch.Tensor:
  class MultiTaskCritic (line 247) | class MultiTaskCritic(Critic):
    method __init__ (line 248) | def __init__(self, num_tasks: int, task_embedding_dim: int, *args, **k...
    method forward (line 256) | def forward(self, obs: torch.Tensor, actions: torch.Tensor) -> torch.T...
    method projection (line 265) | def projection(

FILE: fast_td3/fast_td3_deploy.py
  class Policy (line 10) | class Policy(nn.Module):
    method __init__ (line 11) | def __init__(
    method forward (line 65) | def forward(self, obs: torch.Tensor) -> torch.Tensor:
    method act (line 71) | def act(self, obs: torch.Tensor) -> torch.distributions.Normal:
  function load_policy (line 76) | def load_policy(checkpoint_path):

FILE: fast_td3/fast_td3_simbav2.py
  function l2normalize (line 7) | def l2normalize(
  class Scaler (line 14) | class Scaler(nn.Module):
    method __init__ (line 19) | def __init__(
    method forward (line 30) | def forward(self, x: torch.Tensor) -> torch.Tensor:
  class HyperDense (line 34) | class HyperDense(nn.Module):
    method __init__ (line 39) | def __init__(self, in_dim: int, hidden_dim: int, device: torch.device ...
    method forward (line 44) | def forward(self, x: torch.Tensor) -> torch.Tensor:
  class HyperMLP (line 48) | class HyperMLP(nn.Module):
    method __init__ (line 53) | def __init__(
    method forward (line 69) | def forward(self, x: torch.Tensor) -> torch.Tensor:
  class HyperEmbedder (line 79) | class HyperEmbedder(nn.Module):
    method __init__ (line 84) | def __init__(
    method forward (line 99) | def forward(self, x: torch.Tensor) -> torch.Tensor:
  class HyperLERPBlock (line 111) | class HyperLERPBlock(nn.Module):
    method __init__ (line 116) | def __init__(
    method forward (line 142) | def forward(self, x: torch.Tensor) -> torch.Tensor:
  class HyperTanhPolicy (line 152) | class HyperTanhPolicy(nn.Module):
    method __init__ (line 157) | def __init__(
    method forward (line 171) | def forward(self, x: torch.Tensor) -> torch.Tensor:
  class HyperCategoricalValue (line 180) | class HyperCategoricalValue(nn.Module):
    method __init__ (line 185) | def __init__(
    method forward (line 199) | def forward(self, x: torch.Tensor) -> torch.Tensor:
  class DistributionalQNetwork (line 206) | class DistributionalQNetwork(nn.Module):
    method __init__ (line 207) | def __init__(
    method forward (line 261) | def forward(self, obs: torch.Tensor, actions: torch.Tensor) -> torch.T...
    method projection (line 268) | def projection(
  class Critic (line 316) | class Critic(nn.Module):
    method __init__ (line 317) | def __init__(
    method forward (line 373) | def forward(self, obs: torch.Tensor, actions: torch.Tensor) -> torch.T...
    method projection (line 376) | def projection(
    method get_value (line 405) | def get_value(self, probs: torch.Tensor) -> torch.Tensor:
  class Actor (line 410) | class Actor(nn.Module):
    method __init__ (line 411) | def __init__(
    method forward (line 471) | def forward(self, obs: torch.Tensor) -> torch.Tensor:
    method explore (line 478) | def explore(
  class MultiTaskActor (line 504) | class MultiTaskActor(Actor):
    method __init__ (line 505) | def __init__(self, num_tasks: int, task_embedding_dim: int, *args, **k...
    method forward (line 513) | def forward(self, obs: torch.Tensor) -> torch.Tensor:
  class MultiTaskCritic (line 523) | class MultiTaskCritic(Critic):
    method __init__ (line 524) | def __init__(self, num_tasks: int, task_embedding_dim: int, *args, **k...
    method forward (line 532) | def forward(self, obs: torch.Tensor, actions: torch.Tensor) -> torch.T...
    method projection (line 541) | def projection(

FILE: fast_td3/fast_td3_utils.py
  class SimpleReplayBuffer (line 12) | class SimpleReplayBuffer(nn.Module):
    method __init__ (line 13) | def __init__(
    method extend (line 90) | def extend(
    method sample (line 125) | def sample(self, batch_size: int):
  class EmpiricalNormalization (line 402) | class EmpiricalNormalization(nn.Module):
    method __init__ (line 405) | def __init__(self, shape, device, eps=1e-2, until=None):
    method mean (line 424) | def mean(self):
    method std (line 428) | def std(self):
    method forward (line 432) | def forward(
    method update (line 448) | def update(self, x):
    method inverse (line 496) | def inverse(self, y):
  class RewardNormalizer (line 500) | class RewardNormalizer(nn.Module):
    method __init__ (line 501) | def __init__(
    method _scale_reward (line 518) | def _scale_reward(self, rewards: torch.Tensor) -> torch.Tensor:
    method update_stats (line 525) | def update_stats(
    method forward (line 540) | def forward(self, rewards: torch.Tensor) -> torch.Tensor:
  class PerTaskEmpiricalNormalization (line 544) | class PerTaskEmpiricalNormalization(nn.Module):
    method __init__ (line 547) | def __init__(
    method forward (line 582) | def forward(
    method update (line 615) | def update(self, x: torch.Tensor, task_ids: torch.Tensor):
  class PerTaskRewardNormalizer (line 656) | class PerTaskRewardNormalizer(nn.Module):
    method __init__ (line 657) | def __init__(
    method _scale_reward (line 684) | def _scale_reward(
    method update_stats (line 706) | def update_stats(
    method forward (line 739) | def forward(self, rewards: torch.Tensor, task_ids: torch.Tensor) -> to...
  function cpu_state (line 750) | def cpu_state(sd):
  function save_params (line 755) | def save_params(
  function get_ddp_state_dict (line 795) | def get_ddp_state_dict(model):
  function load_ddp_state_dict (line 802) | def load_ddp_state_dict(model, state_dict):
  function mark_step (line 811) | def mark_step():

FILE: fast_td3/hyperparams.py
  class BaseArgs (line 7) | class BaseArgs:
  function get_args (line 129) | def get_args():
  class HumanoidBenchArgs (line 205) | class HumanoidBenchArgs(BaseArgs):
  class H1HandReachArgs (line 211) | class H1HandReachArgs(HumanoidBenchArgs):
  class H1HandBalanceSimpleArgs (line 218) | class H1HandBalanceSimpleArgs(HumanoidBenchArgs):
  class H1HandBalanceHardArgs (line 224) | class H1HandBalanceHardArgs(HumanoidBenchArgs):
  class H1HandPoleArgs (line 230) | class H1HandPoleArgs(HumanoidBenchArgs):
  class H1HandTruckArgs (line 236) | class H1HandTruckArgs(HumanoidBenchArgs):
  class H1HandMazeArgs (line 242) | class H1HandMazeArgs(HumanoidBenchArgs):
  class H1HandPushArgs (line 249) | class H1HandPushArgs(HumanoidBenchArgs):
  class H1HandBasketballArgs (line 257) | class H1HandBasketballArgs(HumanoidBenchArgs):
  class H1HandWindowArgs (line 265) | class H1HandWindowArgs(HumanoidBenchArgs):
  class H1HandPackageArgs (line 271) | class H1HandPackageArgs(HumanoidBenchArgs):
  class H1HandTruckArgs (line 278) | class H1HandTruckArgs(HumanoidBenchArgs):
  class MuJoCoPlaygroundArgs (line 285) | class MuJoCoPlaygroundArgs(BaseArgs):
  class MTBenchArgs (line 296) | class MTBenchArgs(BaseArgs):
  class MetaWorldMT10Args (line 310) | class MetaWorldMT10Args(MTBenchArgs):
  class MetaWorldMT50Args (line 321) | class MetaWorldMT50Args(MTBenchArgs):
  class G1JoystickFlatTerrainArgs (line 333) | class G1JoystickFlatTerrainArgs(MuJoCoPlaygroundArgs):
  class G1JoystickRoughTerrainArgs (line 339) | class G1JoystickRoughTerrainArgs(MuJoCoPlaygroundArgs):
  class T1JoystickFlatTerrainArgs (line 345) | class T1JoystickFlatTerrainArgs(MuJoCoPlaygroundArgs):
  class T1JoystickRoughTerrainArgs (line 351) | class T1JoystickRoughTerrainArgs(MuJoCoPlaygroundArgs):
  class T1LowDofJoystickFlatTerrainArgs (line 357) | class T1LowDofJoystickFlatTerrainArgs(MuJoCoPlaygroundArgs):
  class T1LowDofJoystickRoughTerrainArgs (line 363) | class T1LowDofJoystickRoughTerrainArgs(MuJoCoPlaygroundArgs):
  class CheetahRunArgs (line 369) | class CheetahRunArgs(MuJoCoPlaygroundArgs):
  class Go1JoystickFlatTerrainArgs (line 381) | class Go1JoystickFlatTerrainArgs(MuJoCoPlaygroundArgs):
  class Go1JoystickRoughTerrainArgs (line 391) | class Go1JoystickRoughTerrainArgs(MuJoCoPlaygroundArgs):
  class Go1GetupArgs (line 401) | class Go1GetupArgs(MuJoCoPlaygroundArgs):
  class LeapCubeReorientArgs (line 411) | class LeapCubeReorientArgs(MuJoCoPlaygroundArgs):
  class LeapCubeRotateZAxisArgs (line 422) | class LeapCubeRotateZAxisArgs(MuJoCoPlaygroundArgs):
  class IsaacLabArgs (line 433) | class IsaacLabArgs(BaseArgs):
  class IsaacLiftCubeFrankaArgs (line 447) | class IsaacLiftCubeFrankaArgs(IsaacLabArgs):
  class IsaacOpenDrawerFrankaArgs (line 464) | class IsaacOpenDrawerFrankaArgs(IsaacLabArgs):
  class IsaacVelocityFlatH1Args (line 475) | class IsaacVelocityFlatH1Args(IsaacLabArgs):
  class IsaacVelocityFlatG1Args (line 483) | class IsaacVelocityFlatG1Args(IsaacLabArgs):
  class IsaacVelocityRoughH1Args (line 491) | class IsaacVelocityRoughH1Args(IsaacLabArgs):
  class IsaacVelocityRoughG1Args (line 500) | class IsaacVelocityRoughG1Args(IsaacLabArgs):
  class IsaacReposeCubeAllegroDirectArgs (line 509) | class IsaacReposeCubeAllegroDirectArgs(IsaacLabArgs):
  class IsaacReposeCubeShadowDirectArgs (line 517) | class IsaacReposeCubeShadowDirectArgs(IsaacLabArgs):

FILE: fast_td3/train.py
  function main (line 53) | def main():

FILE: fast_td3/train_multigpu.py
  function setup_distributed (line 57) | def setup_distributed(rank: int, world_size: int):
  function main (line 72) | def main(rank: int, world_size: int):