SYMBOL INDEX (132 symbols across 6 files) FILE: CartPole-A3C.py class Brain (line 44) | class Brain: method __init__ (line 48) | def __init__(self): method _build_model (line 61) | def _build_model(self): method _build_graph (line 74) | def _build_graph(self, model): method optimize (line 95) | def optimize(self): method train_push (line 121) | def train_push(self, s, a, r, s_): method predict (line 134) | def predict(self, s): method predict_p (line 139) | def predict_p(self, s): method predict_v (line 144) | def predict_v(self, s): class Agent (line 151) | class Agent: method __init__ (line 152) | def __init__(self, eps_start, eps_end, eps_steps): method getEpsilon (line 160) | def getEpsilon(self): method act (line 166) | def act(self, s): method train (line 182) | def train(self, s, a, r, s_): class Environment (line 217) | class Environment(threading.Thread): method __init__ (line 220) | def __init__(self, render=False, eps_start=EPS_START, eps_end=EPS_STOP... method runEpisode (line 227) | def runEpisode(self): method run (line 252) | def run(self): method stop (line 256) | def stop(self): class Optimizer (line 260) | class Optimizer(threading.Thread): method __init__ (line 263) | def __init__(self): method run (line 266) | def run(self): method stop (line 270) | def stop(self): FILE: CartPole-DQN.py function huber_loss (line 22) | def huber_loss(y_true, y_pred): class Brain (line 38) | class Brain: method __init__ (line 39) | def __init__(self, stateCnt, actionCnt): method _createModel (line 46) | def _createModel(self): method train (line 57) | def train(self, x, y, epochs=1, verbose=0): method predict (line 60) | def predict(self, s, target=False): method predictOne (line 66) | def predictOne(self, s, target=False): method updateTargetModel (line 69) | def updateTargetModel(self): class Memory (line 73) | class Memory: # stored as ( s, a, r, s_ ) method __init__ (line 76) | def __init__(self, capacity): method add (line 79) | def add(self, sample): method sample (line 85) | def sample(self, n): method isFull (line 89) | def isFull(self): class Agent (line 104) | class Agent: method __init__ (line 108) | def __init__(self, stateCnt, actionCnt): method act (line 115) | def act(self, s): method observe (line 121) | def observe(self, sample): # in (s, a, r, s_) format method replay (line 138) | def replay(self): class RandomAgent (line 169) | class RandomAgent: method __init__ (line 172) | def __init__(self, actionCnt): method act (line 175) | def act(self, s): method observe (line 178) | def observe(self, sample): # in (s, a, r, s_) format method replay (line 181) | def replay(self): class Environment (line 185) | class Environment: method __init__ (line 186) | def __init__(self, problem): method run (line 190) | def run(self, agent): FILE: CartPole-basic.py class Brain (line 24) | class Brain: method __init__ (line 25) | def __init__(self, stateCnt, actionCnt): method _createModel (line 32) | def _createModel(self): method train (line 43) | def train(self, x, y, epoch=1, verbose=0): method predict (line 46) | def predict(self, s): method predictOne (line 49) | def predictOne(self, s): class Memory (line 53) | class Memory: # stored as ( s, a, r, s_ ) method __init__ (line 56) | def __init__(self, capacity): method add (line 59) | def add(self, sample): method sample (line 65) | def sample(self, n): class Agent (line 79) | class Agent: method __init__ (line 83) | def __init__(self, stateCnt, actionCnt): method act (line 90) | def act(self, s): method observe (line 96) | def observe(self, sample): # in (s, a, r, s_) format method replay (line 103) | def replay(self): class Environment (line 134) | class Environment: method __init__ (line 135) | def __init__(self, problem): method run (line 139) | def run(self, agent): FILE: MountainCar-basic.py function printQ (line 24) | def printQ(agent): function mapBrain (line 41) | def mapBrain(brain, res): function displayBrain (line 55) | def displayBrain(brain, res=50): class Brain (line 83) | class Brain: method __init__ (line 84) | def __init__(self, stateCnt, actionCnt): method _createModel (line 91) | def _createModel(self): method train (line 102) | def train(self, x, y, epoch=1, verbose=0): method predict (line 105) | def predict(self, s): method predictOne (line 108) | def predictOne(self, s): class Memory (line 112) | class Memory: # stored as ( s, a, r, s_ ) method __init__ (line 115) | def __init__(self, capacity): method add (line 118) | def add(self, sample): method sample (line 124) | def sample(self, n): method isFull (line 128) | def isFull(self): class Agent (line 141) | class Agent: method __init__ (line 145) | def __init__(self, stateCnt, actionCnt): method act (line 152) | def act(self, s): method observe (line 158) | def observe(self, sample): # in (s, a, r, s_) format method replay (line 172) | def replay(self): class RandomAgent (line 202) | class RandomAgent: method __init__ (line 205) | def __init__(self, actionCnt): method act (line 208) | def act(self, s): method observe (line 211) | def observe(self, sample): # in (s, a, r, s_) format method replay (line 214) | def replay(self): class Environment (line 218) | class Environment: method __init__ (line 219) | def __init__(self, problem): method normalize (line 229) | def normalize(self, s): method run (line 232) | def run(self, agent): FILE: Seaquest-DDQN-PER.py function huber_loss (line 23) | def huber_loss(y_true, y_pred): function processImage (line 34) | def processImage( img ): class Brain (line 48) | class Brain: method __init__ (line 49) | def __init__(self, stateCnt, actionCnt): method _createModel (line 56) | def _createModel(self): method train (line 72) | def train(self, x, y, epochs=1, verbose=0): method predict (line 75) | def predict(self, s, target=False): method predictOne (line 81) | def predictOne(self, s, target=False): method updateTargetModel (line 84) | def updateTargetModel(self): class Memory (line 88) | class Memory: # stored as ( s, a, r, s_ ) in SumTree method __init__ (line 92) | def __init__(self, capacity): method _getPriority (line 95) | def _getPriority(self, error): method add (line 98) | def add(self, error, sample): method sample (line 102) | def sample(self, n): method update (line 116) | def update(self, idx, error): class Agent (line 135) | class Agent: method __init__ (line 139) | def __init__(self, stateCnt, actionCnt): method act (line 146) | def act(self, s): method observe (line 152) | def observe(self, sample): # in (s, a, r, s_) format method _getTargets (line 163) | def _getTargets(self, batch): method replay (line 195) | def replay(self): class RandomAgent (line 206) | class RandomAgent: method __init__ (line 210) | def __init__(self, actionCnt): method act (line 213) | def act(self, s): method observe (line 216) | def observe(self, sample): # in (s, a, r, s_) format method replay (line 221) | def replay(self): class Environment (line 225) | class Environment: method __init__ (line 226) | def __init__(self, problem): method run (line 230) | def run(self, agent): FILE: SumTree.py class SumTree (line 3) | class SumTree: method __init__ (line 6) | def __init__(self, capacity): method _propagate (line 11) | def _propagate(self, idx, change): method _retrieve (line 19) | def _retrieve(self, idx, s): method total (line 31) | def total(self): method add (line 34) | def add(self, p, data): method update (line 44) | def update(self, idx, p): method get (line 50) | def get(self, s):