Tianshou
v0.2.1
Tutorials
Deep Q Network
Basic concepts in Tianshou
Tabular Q Learning Implementation
Train a model-free RL agent within 30s
API Docs
tianshou.data
tianshou.env
tianshou.policy
tianshou.trainer
tianshou.exploration
tianshou.utils
Community
Contributing
Tianshou
Docs
»
Index
Edit on GitHub
Index
_
|
A
|
B
|
C
|
D
|
E
|
G
|
L
|
M
|
O
|
P
|
R
|
S
|
T
|
U
|
V
_
__call__() (tianshou.exploration.OUNoise method)
(tianshou.policy.A2CPolicy method)
(tianshou.policy.BasePolicy method)
(tianshou.policy.DDPGPolicy method)
(tianshou.policy.DQNPolicy method)
(tianshou.policy.PGPolicy method)
(tianshou.policy.PPOPolicy method)
(tianshou.policy.SACPolicy method)
__getitem__() (tianshou.data.Batch method)
(tianshou.data.ReplayBuffer method)
__len__() (tianshou.data.Batch method)
(tianshou.data.ReplayBuffer method)
(tianshou.env.BaseVectorEnv method)
A
A2CPolicy (class in tianshou.policy)
add() (tianshou.data.PrioritizedReplayBuffer method)
(tianshou.data.ReplayBuffer method)
(tianshou.utils.MovAvg method)
append() (tianshou.data.Batch method)
B
BasePolicy (class in tianshou.policy)
BaseVectorEnv (class in tianshou.env)
Batch (class in tianshou.data)
C
close() (tianshou.data.Collector method)
(tianshou.env.BaseVectorEnv method)
(tianshou.env.RayVectorEnv method)
(tianshou.env.SubprocVectorEnv method)
(tianshou.env.VectorEnv method)
collect() (tianshou.data.Collector method)
Collector (class in tianshou.data)
D
DDPGPolicy (class in tianshou.policy)
DQNPolicy (class in tianshou.policy)
E
eval() (tianshou.policy.DDPGPolicy method)
(tianshou.policy.DQNPolicy method)
(tianshou.policy.PPOPolicy method)
(tianshou.policy.SACPolicy method)
(tianshou.policy.TD3Policy method)
G
gather_info() (in module tianshou.trainer)
get() (tianshou.utils.MovAvg method)
get_env_num() (tianshou.data.Collector method)
L
learn() (tianshou.policy.A2CPolicy method)
(tianshou.policy.BasePolicy method)
(tianshou.policy.DDPGPolicy method)
(tianshou.policy.DQNPolicy method)
(tianshou.policy.PGPolicy method)
(tianshou.policy.PPOPolicy method)
(tianshou.policy.SACPolicy method)
(tianshou.policy.TD3Policy method)
ListReplayBuffer (class in tianshou.data)
M
mean() (tianshou.utils.MovAvg method)
module
tianshou.data
tianshou.env
tianshou.exploration
tianshou.policy
tianshou.trainer
tianshou.utils
MovAvg (class in tianshou.utils)
O
offpolicy_trainer() (in module tianshou.trainer)
onpolicy_trainer() (in module tianshou.trainer)
OUNoise (class in tianshou.exploration)
P
PGPolicy (class in tianshou.policy)
PPOPolicy (class in tianshou.policy)
PrioritizedReplayBuffer (class in tianshou.data)
process_fn() (tianshou.policy.BasePolicy method)
(tianshou.policy.DDPGPolicy method)
(tianshou.policy.DQNPolicy method)
(tianshou.policy.PGPolicy method)
R
RayVectorEnv (class in tianshou.env)
render() (tianshou.data.Collector method)
(tianshou.env.BaseVectorEnv method)
(tianshou.env.RayVectorEnv method)
(tianshou.env.SubprocVectorEnv method)
(tianshou.env.VectorEnv method)
ReplayBuffer (class in tianshou.data)
reset() (tianshou.data.ListReplayBuffer method)
(tianshou.data.PrioritizedReplayBuffer method)
(tianshou.data.ReplayBuffer method)
(tianshou.env.BaseVectorEnv method)
(tianshou.env.RayVectorEnv method)
(tianshou.env.SubprocVectorEnv method)
(tianshou.env.VectorEnv method)
(tianshou.exploration.OUNoise method)
reset_buffer() (tianshou.data.Collector method)
reset_env() (tianshou.data.Collector method)
S
SACPolicy (class in tianshou.policy)
sample() (tianshou.data.Collector method)
(tianshou.data.PrioritizedReplayBuffer method)
(tianshou.data.ReplayBuffer method)
seed() (tianshou.data.Collector method)
(tianshou.env.BaseVectorEnv method)
(tianshou.env.RayVectorEnv method)
(tianshou.env.SubprocVectorEnv method)
(tianshou.env.VectorEnv method)
set_eps() (tianshou.policy.DDPGPolicy method)
(tianshou.policy.DQNPolicy method)
split() (tianshou.data.Batch method)
std() (tianshou.utils.MovAvg method)
step() (tianshou.env.BaseVectorEnv method)
(tianshou.env.RayVectorEnv method)
(tianshou.env.SubprocVectorEnv method)
(tianshou.env.VectorEnv method)
SubprocVectorEnv (class in tianshou.env)
sync_weight() (tianshou.policy.DDPGPolicy method)
(tianshou.policy.DQNPolicy method)
(tianshou.policy.PPOPolicy method)
(tianshou.policy.SACPolicy method)
(tianshou.policy.TD3Policy method)
T
TD3Policy (class in tianshou.policy)
test_episode() (in module tianshou.trainer)
tianshou.data
module
tianshou.env
module
tianshou.exploration
module
tianshou.policy
module
tianshou.trainer
module
tianshou.utils
module
train() (tianshou.policy.DDPGPolicy method)
(tianshou.policy.DQNPolicy method)
(tianshou.policy.PPOPolicy method)
(tianshou.policy.SACPolicy method)
(tianshou.policy.TD3Policy method)
U
update() (tianshou.data.ReplayBuffer method)
V
VectorEnv (class in tianshou.env)