Source code for xuance.tensorflow.learners.multi_agent_rl.masacdis_learner

"""
Multi-agent Soft Actor-critic (MASAC) with discrete action spaces.
Implementation: PyTorch
"""
import torch
from torch import nn
from xuance.common import List
from argparse import Namespace
from xuance.torch.learners.multi_agent_rl.isac_learner import ISAC_Learner
from operator import itemgetter


class MASACDIS_Learner(ISAC_Learner):
    """Learner for multi-agent soft actor-critic (MASAC) with discrete actions.

    Construction is delegated entirely to ``ISAC_Learner``. Both update
    methods defined here are skeletal: they advance the iteration counter and
    return an empty info dict; no loss is computed from the sampled batch.
    """

    def __init__(self,
                 config: Namespace,
                 model_keys: List[str],
                 agent_keys: List[str],
                 policy: nn.Module,
                 callback):
        """Forward every argument, unchanged and in order, to ``ISAC_Learner``.

        Args:
            config: Parsed configuration namespace.
            model_keys: String keys passed through to the parent learner.
            agent_keys: String keys passed through to the parent learner.
            policy: Policy module passed through to the parent learner.
            callback: Callback object passed through to the parent learner.
        """
        super().__init__(config, model_keys, agent_keys, policy, callback)

    def update(self, sample):
        """Advance one iteration and soft-update the policy.

        Args:
            sample: Sampled training batch. Not read by this implementation.

        Returns:
            An empty ``dict``; no training statistics are recorded.
        """
        # NOTE(review): `iterations`, `policy` and `tau` are presumably set up
        # by ISAC_Learner.__init__ -- confirm against the parent class.
        self.iterations += 1
        info = {}
        self.policy.soft_update(self.tau)
        return info

    def update_rnn(self, sample):
        """Advance one iteration for the recurrent variant.

        Unlike ``update``, this method does not call ``policy.soft_update``.

        Args:
            sample: Sampled training batch. Not read by this implementation.

        Returns:
            An empty ``dict``; no training statistics are recorded.
        """
        self.iterations += 1
        info = {}
        return info