MindSpore
安装部署
安装MindSpore Reinforcement
使用指南
强化学习配置说明
使用MindSpore Reinforcement实现深度Q学习(DQN)
ReplayBuffer 使用说明
API参考
mindspore_rl
RELEASE NOTES
MindSpore Reinforcement Release Notes
MindSpore
»
Index
Index
A
|
B
|
C
|
D
|
E
|
F
|
G
|
I
|
L
|
M
|
N
|
O
|
P
|
R
|
S
|
T
|
U
A
act() (mindspore_rl.agent.Actor method)
(mindspore_rl.agent.Agent method)
act_init() (mindspore_rl.agent.Actor method)
action_space (mindspore_rl.environment.Environment property)
(mindspore_rl.environment.GymEnvironment property)
(mindspore_rl.environment.MsEnvironment property)
(mindspore_rl.environment.MultiEnvironmentWrapper property)
(mindspore_rl.environment.StarCraft2Environment property)
(mindspore_rl.environment.TicTacToeEnvironment property)
B
boundary (mindspore_rl.environment.Space property)
C
calculate_rewards() (mindspore_rl.environment.TicTacToeEnvironment method)
config (mindspore_rl.environment.Environment property)
(mindspore_rl.environment.GymEnvironment property)
(mindspore_rl.environment.MsEnvironment property)
(mindspore_rl.environment.MultiEnvironmentWrapper property)
(mindspore_rl.environment.StarCraft2Environment property)
(mindspore_rl.environment.TicTacToeEnvironment property)
construct() (mindspore_rl.network.FullyConnectedLayers method)
(mindspore_rl.network.FullyConnectedNet method)
(mindspore_rl.network.GruNet method)
(mindspore_rl.policy.EpsilonGreedyPolicy method)
(mindspore_rl.policy.GreedyPolicy method)
(mindspore_rl.policy.Policy method)
(mindspore_rl.policy.RandomPolicy method)
current_player() (mindspore_rl.environment.TicTacToeEnvironment method)
D
destroy() (mindspore_rl.core.PriorityReplayBuffer method)
done_space (mindspore_rl.environment.Environment property)
(mindspore_rl.environment.GymEnvironment property)
(mindspore_rl.environment.MsEnvironment property)
(mindspore_rl.environment.MultiEnvironmentWrapper property)
(mindspore_rl.environment.StarCraft2Environment property)
(mindspore_rl.environment.TicTacToeEnvironment property)
E
evaluate() (mindspore_rl.agent.Actor method)
(mindspore_rl.agent.Trainer method)
F
full() (mindspore_rl.core.ReplayBuffer method)
(mindspore_rl.core.UniformReplayBuffer method)
G
get_action() (mindspore_rl.agent.Actor method)
(mindspore_rl.agent.Agent method)
get_item() (mindspore_rl.core.ReplayBuffer method)
(mindspore_rl.core.UniformReplayBuffer method)
get_replay_buffer() (mindspore_rl.core.MSRL method)
get_replay_buffer_elements() (mindspore_rl.core.MSRL method)
get_step_info() (mindspore_rl.environment.StarCraft2Environment method)
I
init() (mindspore_rl.core.MSRL method)
insert() (mindspore_rl.core.ReplayBuffer method)
(mindspore_rl.core.UniformReplayBuffer method)
is_discrete (mindspore_rl.environment.Space property)
is_terminal() (mindspore_rl.environment.TicTacToeEnvironment method)
L
learn() (mindspore_rl.agent.Agent method)
(mindspore_rl.agent.Learner method)
legal_action() (mindspore_rl.environment.TicTacToeEnvironment method)
load() (mindspore_rl.environment.TicTacToeEnvironment method)
load_and_eval() (mindspore_rl.agent.Trainer method)
M
max_utility() (mindspore_rl.environment.TicTacToeEnvironment method)
mindspore_rl.agent.Actor (built-in class)
mindspore_rl.agent.Agent (built-in class)
mindspore_rl.agent.Learner (built-in class)
mindspore_rl.agent.Trainer (built-in class)
mindspore_rl.core.MSRL (built-in class)
mindspore_rl.core.PriorityReplayBuffer (built-in class)
mindspore_rl.core.Session (built-in class)
mindspore_rl.core.UniformReplayBuffer (built-in class)
mindspore_rl.environment.Environment (built-in class)
mindspore_rl.environment.EnvironmentProcess (built-in class)
mindspore_rl.environment.GymEnvironment (built-in class)
mindspore_rl.environment.MsEnvironment (built-in class)
mindspore_rl.environment.MultiEnvironmentWrapper (built-in class)
mindspore_rl.environment.Space (built-in class)
mindspore_rl.environment.StarCraft2Environment (built-in class)
mindspore_rl.environment.TicTacToeEnvironment (built-in class)
mindspore_rl.network.FullyConnectedLayers (built-in class)
mindspore_rl.network.FullyConnectedNet (built-in class)
mindspore_rl.network.GruNet (built-in class)
mindspore_rl.policy.EpsilonGreedyPolicy (built-in class)
mindspore_rl.policy.GreedyPolicy (built-in class)
mindspore_rl.policy.Policy (built-in class)
mindspore_rl.policy.RandomPolicy (built-in class)
ms_dtype (mindspore_rl.environment.Space property)
N
np_dtype (mindspore_rl.environment.Space property)
num_values (mindspore_rl.environment.Space property)
O
observation_space (mindspore_rl.environment.Environment property)
(mindspore_rl.environment.GymEnvironment property)
(mindspore_rl.environment.MsEnvironment property)
(mindspore_rl.environment.MultiEnvironmentWrapper property)
(mindspore_rl.environment.StarCraft2Environment property)
(mindspore_rl.environment.TicTacToeEnvironment property)
P
push() (mindspore_rl.core.PriorityReplayBuffer method)
R
ReplayBuffer (class in mindspore_rl.core)
reset() (mindspore_rl.core.ReplayBuffer method)
(mindspore_rl.core.UniformReplayBuffer method)
(mindspore_rl.environment.Environment method)
(mindspore_rl.environment.GymEnvironment method)
(mindspore_rl.environment.MsEnvironment method)
(mindspore_rl.environment.MultiEnvironmentWrapper method)
(mindspore_rl.environment.StarCraft2Environment method)
(mindspore_rl.environment.TicTacToeEnvironment method)
reward_space (mindspore_rl.environment.Environment property)
(mindspore_rl.environment.GymEnvironment property)
(mindspore_rl.environment.MsEnvironment property)
(mindspore_rl.environment.MultiEnvironmentWrapper property)
(mindspore_rl.environment.StarCraft2Environment property)
(mindspore_rl.environment.TicTacToeEnvironment property)
run() (mindspore_rl.core.Session method)
(mindspore_rl.environment.EnvironmentProcess method)
S
sample() (mindspore_rl.core.PriorityReplayBuffer method)
(mindspore_rl.core.ReplayBuffer method)
(mindspore_rl.core.UniformReplayBuffer method)
(mindspore_rl.environment.Space method)
save() (mindspore_rl.environment.TicTacToeEnvironment method)
shape (mindspore_rl.environment.Space property)
size() (mindspore_rl.core.ReplayBuffer method)
(mindspore_rl.core.UniformReplayBuffer method)
step() (mindspore_rl.environment.Environment method)
(mindspore_rl.environment.GymEnvironment method)
(mindspore_rl.environment.MsEnvironment method)
(mindspore_rl.environment.MultiEnvironmentWrapper method)
(mindspore_rl.environment.StarCraft2Environment method)
(mindspore_rl.environment.TicTacToeEnvironment method)
T
train() (mindspore_rl.agent.Trainer method)
train_one_episode() (mindspore_rl.agent.Trainer method)
trainable_variables() (mindspore_rl.agent.Trainer method)
U
update_priorities() (mindspore_rl.core.PriorityReplayBuffer method)