From 76f134d4ebce861bd3615e16631614c2c77c2553 Mon Sep 17 00:00:00 2001 From: baijinqiu <2522827873@qq.com> Date: Mon, 25 Dec 2023 16:27:03 +0800 Subject: [PATCH] 'MATD3_learner_x(#1)' --- docs/source/documents/api/learners/marl/matd3.rst | 8 ++++---- 1 file changed, 4 insertions(+), 4 deletions(-) diff --git a/docs/source/documents/api/learners/marl/matd3.rst b/docs/source/documents/api/learners/marl/matd3.rst index d53fee5e..0d0d5eef 100644 --- a/docs/source/documents/api/learners/marl/matd3.rst +++ b/docs/source/documents/api/learners/marl/matd3.rst @@ -1,7 +1,7 @@ MATD3_Learner ===================================== -xxxxxx. +The implementation of the Multi-Agent Twin Delayed Deep Deterministic Policy Gradient (MATD3) algorithm. .. raw:: html @@ -35,7 +35,7 @@ PyTorch .. py:function:: xuance.torch.learners.multi_agent_rl.matd3_learner.MATD3_Learner.update(sample) - xxxxxx. + This method performs a single update step for the MATD3 learner based on the given experience sample. :param sample: A dictionary contianing necessary experience data that is sampled from experience replay buffer. :type sample: dict @@ -72,7 +72,7 @@ TensorFlow .. py:function:: xuance.tensorflow.learners.multi_agent_rl.matd3_learner.MATD3_Learner.update(sample) - xxxxxx. + This method performs a single update step for the MATD3 learner based on the given experience sample. :param sample: A dictionary contianing necessary experience data that is sampled from experience replay buffer. :type sample: dict @@ -109,7 +109,7 @@ MindSpore .. py:function:: xuance.mindspore.learners.multi_agent_rl.matd3_learner.MATD3_Learner.update(sample) - xxxxxx. + This method performs a single update step for the MATD3 learner based on the given experience sample. :param sample: A dictionary contianing necessary experience data that is sampled from experience replay buffer. :type sample: dict