
swarmrl.trainers.trainer Module API Reference

Module for the Trainer parent.

Trainer

Parent class for the RL Trainer.

Attributes

rl_protocols : list(protocol)
    A list of RL protocols to use in the simulation.
loss : Loss
    An optimization method to compute the loss and update the model.

Source code in swarmrl/trainers/trainer.py
class Trainer:
    """
    Parent class for the RL Trainer.

    Attributes
    ----------
    rl_protocols : list(protocol)
            A list of RL protocols to use in the simulation.
    loss : Loss
            An optimization method to compute the loss and update the model.
    """

    _engine = None

    @property
    def engine(self):
        """
        Runner engine property.
        """
        return self._engine

    @engine.setter
    def engine(self, value):
        """
        Set the engine value.
        """
        self._engine = value

    def __init__(
        self,
        agents: List[ActorCriticAgent],
    ):
        """
        Constructor for the Trainer.

        Parameters
        ----------
        agents : list
                A list of RL agents to train.
        """
        self.agents = {}

        # Add the protocols to an easily accessible internal dict.
        # TODO: Maybe turn into a dataclass? Not sure if it helps yet.
        for agent in agents:
            self.agents[str(agent.particle_type)] = agent

    def initialize_training(self) -> ForceFunction:
        """
        Return an initialized interaction model.

        Returns
        -------
        interaction_model : ForceFunction
                Interaction model to start the simulation with.
        """

        return ForceFunction(
            agents=self.agents,
        )

    def update_rl(self) -> Tuple[ForceFunction, np.ndarray, bool]:
        """
        Update the RL algorithm.

        Returns
        -------
        interaction_model : ForceFunction
                Interaction model to use in the next episode.
        reward : np.ndarray
                Current mean episode reward. This is returned for nice progress bars.
        killed : bool
                Whether or not the task has ended the training.
        """
        reward = 0.0  # TODO: Separate between species and optimize visualization.
        switches = []

        for agent in self.agents.values():
            if isinstance(agent, ActorCriticAgent):
                ag_reward, ag_killed = agent.update_agent()
                reward += np.mean(ag_reward)
                switches.append(ag_killed)

        # Create a new interaction model.
        interaction_model = ForceFunction(agents=self.agents)
        return interaction_model, np.array(reward), any(switches)

    def export_models(self, directory: str = "Models"):
        """
        Export the models to the specified directory.

        Parameters
        ----------
        directory : str (default='Models')
                Directory in which to save the models.

        Returns
        -------
        Saves the actor and the critic to the specified directory.
        """
        for agent in self.agents.values():
            agent.save_agent(directory)

    def restore_models(self, directory: str = "Models"):
        """
        Restore the models from the specified directory.

        Parameters
        ----------
        directory : str (default='Models')
                Directory from which to load the objects.

        Returns
        -------
        Loads the actor and critic from the specified directory.
        """
        for agent in self.agents.values():
            agent.restore_agent(directory)

    def initialize_models(self):
        """
        Initialize all of the models in the gym.
        """
        for agent in self.agents.values():
            agent.initialize_network()

    def perform_rl_training(self, **kwargs):
        """
        Perform the RL training.

        Parameters
        ----------
        **kwargs
            All arguments related to the specific trainer.
        """
        raise NotImplementedError("Implemented in child class")
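
The base class is normally driven by a concrete child trainer, but its public methods can also be called directly. Below is a minimal, hypothetical usage sketch; `my_agents` stands in for a list of already-configured ActorCriticAgent instances built elsewhere and is not defined in this module.

# Minimal usage sketch (not part of the SwarmRL sources). `my_agents` is an
# assumed, pre-built list of ActorCriticAgent instances.
from swarmrl.trainers.trainer import Trainer

trainer = Trainer(agents=my_agents)

# Build fresh network parameters, then an interaction model for the engine.
trainer.initialize_models()
force_function = trainer.initialize_training()

# After the engine has run an episode, update the agents and get a new model.
force_function, mean_reward, killed = trainer.update_rl()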

engine property writable

Runner engine property.

__init__(agents)

Constructor for the Trainer.

Parameters

agents : list
    A list of RL agents to train.

Source code in swarmrl/trainers/trainer.py
def __init__(
    self,
    agents: List[ActorCriticAgent],
):
    """
    Constructor for the Trainer.

    Parameters
    ----------
    agents : list
            A list of RL agents to train.
    """
    self.agents = {}

    # Add the protocols to an easily accessible internal dict.
    # TODO: Maybe turn into a dataclass? Not sure if it helps yet.
    for agent in agents:
        self.agents[str(agent.particle_type)] = agent
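
Because the constructor keys the internal dictionary by str(agent.particle_type), an individual agent can later be looked up by the particle type it controls. A small hypothetical illustration, where `agent_a` and `agent_b` stand in for ActorCriticAgent instances with particle types 0 and 1:

# Hypothetical illustration of the internal agent mapping.
trainer = Trainer(agents=[agent_a, agent_b])

trainer.agents["0"]  # agent controlling particle type 0
trainer.agents["1"]  # agent controlling particle type 1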

export_models(directory='Models')

Export the models to the specified directory.

Parameters

directory : str (default='Models')
    Directory in which to save the models.

Returns

Saves the actor and the critic to the specified directory.

Source code in swarmrl/trainers/trainer.py
def export_models(self, directory: str = "Models"):
    """
    Export the models to the specified directory.

    Parameters
    ----------
    directory : str (default='Models')
            Directory in which to save the models.

    Returns
    -------
    Saves the actor and the critic to the specified directory.
    """
    for agent in self.agents.values():
        agent.save_agent(directory)
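
A short checkpointing sketch; the directory name is arbitrary and the call simply forwards to each agent's save_agent method:

# Save every agent's networks into a common checkpoint directory (sketch).
trainer.export_models(directory="Models")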

initialize_models()

Initialize all of the models in the gym.

Source code in swarmrl/trainers/trainer.py
def initialize_models(self):
    """
    Initialize all of the models in the gym.
    """
    for agent in self.agents.values():
        agent.initialize_network()
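
Either initialize_models (fresh parameters) or restore_models (resume from a checkpoint) should be called before the first episode. A hedged sketch; the resume flag is hypothetical:

# Sketch: choose fresh parameters or a checkpoint before training starts.
if resume_run:  # hypothetical flag, not part of SwarmRL
    trainer.restore_models(directory="Models")
else:
    trainer.initialize_models()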

initialize_training()

Return an initialized interaction model.

Returns

interaction_model : ForceFunction
    Interaction model to start the simulation with.

Source code in swarmrl/trainers/trainer.py
def initialize_training(self) -> ForceFunction:
    """
    Return an initialized interaction model.

    Returns
    -------
    interaction_model : ForceFunction
            Interaction model to start the simulation with.
    """

    return ForceFunction(
        agents=self.agents,
    )
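
The returned ForceFunction wraps the agent dictionary and is the object the simulation engine queries for actions during an episode. A sketch of handing it to a runner engine; `some_engine` and its integrate call are assumptions standing in for whatever the concrete engine exposes:

# Sketch: pass the interaction model to a runner engine. The engine object and
# its integrate call are assumed, not part of this module.
force_function = trainer.initialize_training()
trainer.engine = some_engine
trainer.engine.integrate(1000, force_function)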

perform_rl_training(**kwargs)

Perform the RL training.

Parameters

**kwargs
    All arguments related to the specific trainer.

Source code in swarmrl/trainers/trainer.py
def perform_rl_training(self, **kwargs):
    """
    Perform the RL training.

    Parameters
    ----------
    **kwargs
        All arguments related to the specific trainer.
    """
    raise NotImplementedError("Implemented in child class")
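
Because the base implementation only raises NotImplementedError, concrete trainers override this method with their episode loop. A minimal, hypothetical override; the engine integrate call is an assumption:

# Hypothetical child trainer, shown only to illustrate the expected override.
class MyTrainer(Trainer):
    def perform_rl_training(self, n_episodes: int = 10, episode_length: int = 100):
        force_function = self.initialize_training()
        for _ in range(n_episodes):
            self.engine.integrate(episode_length, force_function)  # assumed engine API
            force_function, reward, killed = self.update_rl()
            if killed:
                break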

restore_models(directory='Models')

Restore the models from the specified directory.

Parameters

directory : str (default='Models')
    Directory from which to load the objects.

Returns

Loads the actor and critic from the specified directory.

Source code in swarmrl/trainers/trainer.py
def restore_models(self, directory: str = "Models"):
    """
    Restore the models from the specified directory.

    Parameters
    ----------
    directory : str (default='Models')
            Directory from which to load the objects.

    Returns
    -------
    Loads the actor and critic from the specified directory.
    """
    for agent in self.agents.values():
        agent.restore_agent(directory)
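
Restoring is the counterpart to export_models and is used to resume a run from saved networks; the directory must match the one passed to export_models. A sketch:

# Resume from a previous checkpoint (sketch).
trainer.restore_models(directory="Models")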

update_rl()

Update the RL algorithm.

Returns

interaction_model : ForceFunction
    Interaction model to use in the next episode.
reward : np.ndarray
    Current mean episode reward. This is returned for nice progress bars.
killed : bool
    Whether or not the task has ended the training.

Source code in swarmrl/trainers/trainer.py
def update_rl(self) -> Tuple[ForceFunction, np.ndarray, bool]:
    """
    Update the RL algorithm.

    Returns
    -------
    interaction_model : ForceFunction
            Interaction model to use in the next episode.
    reward : np.ndarray
            Current mean episode reward. This is returned for nice progress bars.
    killed : bool
            Whether or not the task has ended the training.
    """
    reward = 0.0  # TODO: Separate between species and optimize visualization.
    switches = []

    for agent in self.agents.values():
        if isinstance(agent, ActorCriticAgent):
            ag_reward, ag_killed = agent.update_agent()
            reward += np.mean(ag_reward)
            switches.append(ag_killed)

    # Create a new interaction model.
    interaction_model = ForceFunction(agents=self.agents)
    return interaction_model, np.array(reward), any(switches)
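
Note that the per-agent mean rewards are summed into a single scalar before being wrapped in np.array, and killed becomes True as soon as any agent reports that its task has ended. A sketch of how a training loop typically consumes these values; the reward log is hypothetical:

# Sketch: consuming the update_rl outputs inside an episode loop.
reward_log = []  # hypothetical logging container
force_function, mean_reward, killed = trainer.update_rl()
reward_log.append(float(mean_reward))
if killed:
    print("An agent's task flagged the end of training.")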