diff --git a/src/primaite/game/policy/rllib.py b/src/primaite/game/policy/rllib.py index f45b9fd6..fcebf40d 100644 --- a/src/primaite/game/policy/rllib.py +++ b/src/primaite/game/policy/rllib.py @@ -2,13 +2,15 @@ from pathlib import Path from typing import Literal, Optional, TYPE_CHECKING from primaite.game.policy.policy import PolicyABC -from primaite.session.environment import PrimaiteRayEnv +from primaite.session.environment import PrimaiteRayEnv, PrimaiteRayMARLEnv if TYPE_CHECKING: from primaite.session.session import PrimaiteSession, TrainingOptions import ray +from ray import air, tune from ray.rllib.algorithms import ppo +from ray.rllib.algorithms.ppo import PPOConfig class RaySingleAgentPolicy(PolicyABC, identifier="RLLIB_single_agent"): @@ -54,3 +56,50 @@ class RaySingleAgentPolicy(PolicyABC, identifier="RLLIB_single_agent"): def from_config(cls, config: "TrainingOptions", session: "PrimaiteSession") -> "RaySingleAgentPolicy": """Create a policy from a config.""" return cls(session=session, algorithm=config.rl_algorithm, seed=config.seed) + + +class RayMultiAgentPolicy(PolicyABC, identifier="RLLIB_multi_agent"): + """Multi agent RL policy using Ray RLLib.""" + + def __init__(self, session: "PrimaiteSession", algorithm: Literal["PPO"], seed: Optional[int] = None): + """Initialise multi agent policy wrapper.""" + super().__init__(session=session) + + self.config = ( + PPOConfig() + .environment(env=PrimaiteRayMARLEnv, env_config={"game": session.game}) + .rollouts(num_rollout_workers=0) + .multi_agent( + policies={agent.agent_name for agent in session.game.rl_agents}, + policy_mapping_fn=lambda agent_id, episode, worker, **kw: agent_id, + ) + .training(train_batch_size=128) + ) + + def learn(self, n_episodes: int, timesteps_per_episode: int) -> None: + """Train the agent.""" + tune.Tuner( + "PPO", + run_config=air.RunConfig( + stop={"training_iteration": n_episodes * timesteps_per_episode}, + checkpoint_config=air.CheckpointConfig(checkpoint_frequency=10), 
+ ), + param_space=self.config, + ).fit() + + def load(self, model_path: Path) -> None: + """Load policy parameters from a file.""" + return NotImplemented + + def eval(self, n_episodes: int, deterministic: bool) -> None: + """Evaluate trained policy.""" + return NotImplemented + + def save(self, save_path: Path) -> None: + """Save policy parameters to a file.""" + return NotImplemented + + @classmethod + def from_config(cls, config: "TrainingOptions", session: "PrimaiteSession") -> "RayMultiAgentPolicy": + """Create policy from config.""" + return cls(session=session, algorithm=config.rl_algorithm, seed=config.seed) diff --git a/tests/assets/configs/multi_agent_session.yaml b/tests/assets/configs/multi_agent_session.yaml new file mode 100644 index 00000000..9d71e093 --- /dev/null +++ b/tests/assets/configs/multi_agent_session.yaml @@ -0,0 +1,1166 @@ +training_config: + rl_framework: RLLIB_multi_agent + rl_algorithm: PPO + seed: 333 + n_learn_episodes: 2 + n_eval_episodes: 1 + max_steps_per_episode: 128 + deterministic_eval: false + n_agents: 1 + agent_references: #not used :( + - defender1 + - defender2 + +io_settings: + save_checkpoints: true + checkpoint_interval: 5 + + +game: + max_episode_length: 128 + ports: + - ARP + - DNS + - HTTP + - POSTGRES_SERVER + protocols: + - ICMP + - TCP + - UDP + +agents: + - ref: client_1_green_user + team: GREEN + type: GreenWebBrowsingAgent + observation_space: + type: UC2GreenObservation + action_space: + action_list: + - type: DONOTHING + # + # - type: NODE_LOGON + # - type: NODE_LOGOFF + # - type: NODE_APPLICATION_EXECUTE + # options: + # execution_definition: + # target_address: arcd.com + + options: + nodes: + - node_ref: client_2 + max_folders_per_node: 1 + max_files_per_folder: 1 + max_services_per_node: 1 + max_nics_per_node: 2 + max_acl_rules: 10 + + reward_function: + reward_components: + - type: DUMMY + + agent_settings: + start_step: 5 + frequency: 4 + variance: 3 + + - ref: client_1_data_manipulation_red_bot + team: 
RED + type: RedDatabaseCorruptingAgent + + observation_space: + type: UC2RedObservation + options: + nodes: + - node_ref: client_1 + observations: + - logon_status + - operating_status + services: + - service_ref: data_manipulation_bot + observations: + - operating_status + - health_status + folders: {} + + action_space: + action_list: + - type: DONOTHING + #