'vdac_learner_x(#1)'

agi-brain · Dec 25, 2023 · 61dd9e3 · 61dd9e3
1 parent 4d7fa10
commit 61dd9e3
Showing 1 changed file with 8 additions and 8 deletions.
diff --git a/docs/source/documents/api/learners/marl/vdac.rst b/docs/source/documents/api/learners/marl/vdac.rst
@@ -1,7 +1,7 @@
 VDAC_Learner
 ======================
 
-xxxxxx.
+An implementation of the Value-Decomposition Actor-Critic (VDAC) algorithm.
 
 .. raw:: html
 
@@ -31,7 +31,7 @@ PyTorch
 .. py:function::
   xuance.torch.learners.multi_agent_rl.vdac_learner.VDAC_Learner.lr_decay(i_step)
 
-  xxxxxx.
+  Update the learning rate of the VDAC learner based on the current training step.
 
   :param i_step: The current step.
   :type i_step: int
@@ -41,7 +41,7 @@ PyTorch
 .. py:function::
   xuance.torch.learners.multi_agent_rl.vdac_learner.VDAC_Learner.update(sample)
 
-  xxxxxx.
+  Update the VDAC learner based on the sampled experience from the experience replay buffer.
 
   :param sample: A dictionary contianing necessary experience data that is sampled from experience replay buffer.
   :type sample: dict
@@ -51,7 +51,7 @@ PyTorch
 .. py:function::
   xuance.torch.learners.multi_agent_rl.vdac_learner.VDAC_Learner.update_recurrent(sample)
 
-  xxxxxx.
+  Update the VDAC learner for recurrent architectures based on the sampled experience from the experience replay buffer.
 
   :param sample: A dictionary contianing necessary experience data that is sampled from experience replay buffer.
   :type sample: dict
@@ -84,7 +84,7 @@ TensorFlow
 .. py:function::
   xuance.tensorflow.learners.multi_agent_rl.vdac_learner.VDAC_Learner.lr_decay(i_step)
 
-  xxxxxx.
+  Update the learning rate of the VDAC learner based on the current training step.
 
   :param i_step: The current step.
   :type i_step: int
@@ -94,7 +94,7 @@ TensorFlow
 .. py:function::
   xuance.tensorflow.learners.multi_agent_rl.vdac_learner.VDAC_Learner.update(sample)
 
-  xxxxxx.
+  Update the VDAC learner based on the sampled experience from the experience replay buffer.
 
   :param sample: A dictionary contianing necessary experience data that is sampled from experience replay buffer.
   :type sample: dict
@@ -127,7 +127,7 @@ MindSpore
 .. py:function::
   xuance.mindspore.learners.multi_agent_rl.vdac_learner.VDAC_Learner.lr_decay(i_step)
 
-  xxxxxx.
+  Update the learning rate of the VDAC learner based on the current training step.
 
   :param i_step: The current step.
   :type i_step: int
@@ -137,7 +137,7 @@ MindSpore
 .. py:function::
   xuance.mindspore.learners.multi_agent_rl.vdac_learner.VDAC_Learner.update(sample)
 
-  xxxxxx.
+  Update the VDAC learner for recurrent architectures based on the sampled experience from the experience replay buffer.
 
   :param sample: A dictionary contianing necessary experience data that is sampled from experience replay buffer.
   :type sample: dict