diff --git a/src/primaite/config/_package_data/example_config_2_rl_agents.yaml b/src/primaite/config/_package_data/example_config_2_rl_agents.yaml
new file mode 100644
index 00000000..9450c419
--- /dev/null
+++ b/src/primaite/config/_package_data/example_config_2_rl_agents.yaml
@@ -0,0 +1,1164 @@
+training_config:
+  rl_framework: RLLIB_single_agent  # NOTE(review): two ProxyAgents are defined under `agents` — confirm this value
+  rl_algorithm: PPO
+  seed: 333
+  n_learn_episodes: 1
+  n_eval_episodes: 5
+  max_steps_per_episode: 256  # same limit as game.max_episode_length
+  deterministic_eval: false
+  n_agents: 2  # one per entry in agent_references
+  # Refs of the ProxyAgent entries defined under `agents`.
+  agent_references: [defender1, defender2]
+
+io_settings:
+  save_checkpoints: true
+  checkpoint_interval: 5  # NOTE(review): unit not visible here; n_learn_episodes is 1 — confirm a checkpoint is written
+
+
+game:
+  max_episode_length: 256  # same value as training_config.max_steps_per_episode
+  ports:  # port names; the router_1 ACL rules below use ARP, DNS and POSTGRES_SERVER
+  - ARP
+  - DNS
+  - HTTP
+  - POSTGRES_SERVER
+  protocols:  # protocol names; the router_1 ACL references ICMP
+  - ICMP
+  - TCP
+  - UDP
+
+agents:
+  - ref: client_1_green_user
+    team: GREEN
+    type: GreenWebBrowsingAgent
+    observation_space:
+      type: UC2GreenObservation
+    action_space:
+      action_list:
+        - type: DONOTHING
+        # <not yet implemented>
+        # - type: NODE_LOGON
+        # - type: NODE_LOGOFF
+        # - type: NODE_APPLICATION_EXECUTE
+          # options:
+            # execution_definition:
+              # target_address: arcd.com
+
+      options:
+        nodes:
+        - node_ref: client_2
+        max_folders_per_node: 1
+        max_files_per_folder: 1
+        max_services_per_node: 1
+        max_nics_per_node: 2
+        max_acl_rules: 10
+
+    reward_function:
+      reward_components:
+        - type: DUMMY
+
+    agent_settings:
+      start_step: 5
+      frequency: 4
+      variance: 3
+
+  - ref: client_1_data_manipulation_red_bot
+    team: RED
+    type: RedDatabaseCorruptingAgent
+
+    observation_space:
+      type: UC2RedObservation
+      options:
+        nodes:
+          - node_ref: client_1
+            observations:
+            - logon_status
+            - operating_status
+            services:
+            - service_ref: data_manipulation_bot  # service declared on client_1 in `simulation`
+              observations:  # one list item per observed attribute
+              - operating_status
+              - health_status
+            folders: {}
+
+    action_space:
+      action_list:
+        - type: DONOTHING
+        # <not yet implemented>
+        # - type: NODE_APPLICATION_EXECUTE
+        #   options:
+        #     execution_definition:
+        #       server_ip: 192.168.1.14
+        #       payload: "DELETE"
+        #       success_rate: 80%
+        - type: NODE_FILE_DELETE
+        - type: NODE_FILE_CORRUPT
+        # - type: NODE_FOLDER_DELETE
+        # - type: NODE_FOLDER_CORRUPT
+        - type: NODE_OS_SCAN
+        # - type: NODE_LOGON
+        # - type: NODE_LOGOFF
+      options:
+        nodes:
+        - node_ref: client_1
+        max_folders_per_node: 1
+        max_files_per_folder: 1
+        max_services_per_node: 1
+
+    reward_function:
+      reward_components:
+        - type: DUMMY
+
+    agent_settings: # options specific to this particular agent type, basically args of __init__(self)
+      start_step: 25
+      frequency: 20
+      variance: 5
+
+  - ref: defender1
+    team: BLUE
+    type: ProxyAgent
+
+    observation_space:
+      type: UC2BlueObservation
+      options:
+        num_services_per_node: 1
+        num_folders_per_node: 1
+        num_files_per_folder: 1
+        num_nics_per_node: 2
+        nodes:
+        - node_ref: domain_controller
+          services:
+          - service_ref: domain_controller_dns_server
+        - node_ref: web_server
+          services:
+          - service_ref: web_server_database_client
+        - node_ref: database_server
+          services:
+          - service_ref: database_service
+          folders:
+          - folder_name: database
+            files:
+            - file_name: database.db
+        - node_ref: backup_server
+          # services:
+          # - service_ref: backup_service
+        - node_ref: security_suite
+        - node_ref: client_1
+        - node_ref: client_2
+        links:
+        - link_ref: router_1___switch_1
+        - link_ref: router_1___switch_2
+        - link_ref: switch_1___domain_controller
+        - link_ref: switch_1___web_server
+        - link_ref: switch_1___database_server
+        - link_ref: switch_1___backup_server
+        - link_ref: switch_1___security_suite
+        - link_ref: switch_2___client_1
+        - link_ref: switch_2___client_2
+        - link_ref: switch_2___security_suite
+        acl:
+          options:
+            max_acl_rules: 10
+          router_node_ref: router_1
+          ip_address_order:
+            - node_ref: domain_controller
+              nic_num: 1
+            - node_ref: web_server
+              nic_num: 1
+            - node_ref: database_server
+              nic_num: 1
+            - node_ref: backup_server
+              nic_num: 1
+            - node_ref: security_suite
+              nic_num: 1
+            - node_ref: client_1
+              nic_num: 1
+            - node_ref: client_2
+              nic_num: 1
+            - node_ref: security_suite
+              nic_num: 2
+        ics: null
+
+    action_space:
+      action_list:
+        - type: DONOTHING
+        - type: NODE_SERVICE_SCAN
+        - type: NODE_SERVICE_STOP
+        - type: NODE_SERVICE_START
+        - type: NODE_SERVICE_PAUSE
+        - type: NODE_SERVICE_RESUME
+        - type: NODE_SERVICE_RESTART
+        - type: NODE_SERVICE_DISABLE
+        - type: NODE_SERVICE_ENABLE
+        - type: NODE_FILE_SCAN
+        - type: NODE_FILE_CHECKHASH
+        - type: NODE_FILE_DELETE
+        - type: NODE_FILE_REPAIR
+        - type: NODE_FILE_RESTORE
+        - type: NODE_FOLDER_SCAN
+        - type: NODE_FOLDER_CHECKHASH
+        - type: NODE_FOLDER_REPAIR
+        - type: NODE_FOLDER_RESTORE
+        - type: NODE_OS_SCAN
+        - type: NODE_SHUTDOWN
+        - type: NODE_STARTUP
+        - type: NODE_RESET
+        - type: NETWORK_ACL_ADDRULE
+          options:
+            target_router_ref: router_1
+        - type: NETWORK_ACL_REMOVERULE
+          options:
+            target_router_ref: router_1
+        - type: NETWORK_NIC_ENABLE
+        - type: NETWORK_NIC_DISABLE
+
+      action_map:
+          0:
+            action: DONOTHING
+            options: {}
+          # scan webapp service
+          1:
+            action: NODE_SERVICE_SCAN
+            options:
+              node_id: 2
+              service_id: 1
+          # stop webapp service
+          2:
+            action: NODE_SERVICE_STOP
+            options:
+              node_id: 2
+              service_id: 1
+          # start webapp service
+          3:
+            action: "NODE_SERVICE_START"
+            options:
+                node_id: 2
+                service_id: 1
+          4:
+            action: "NODE_SERVICE_PAUSE"
+            options:
+                node_id: 2
+                service_id: 1
+          5:
+            action: "NODE_SERVICE_RESUME"
+            options:
+                node_id: 2
+                service_id: 1
+          6:
+            action: "NODE_SERVICE_RESTART"
+            options:
+                node_id: 2
+                service_id: 1
+          7:
+            action: "NODE_SERVICE_DISABLE"
+            options:
+                node_id: 2
+                service_id: 1
+          8:
+            action: "NODE_SERVICE_ENABLE"
+            options:
+                node_id: 2
+                service_id: 1
+          9:
+            action: "NODE_FILE_SCAN"
+            options:
+                node_id: 3
+                folder_id: 1
+                file_id: 1
+          10:
+            action: "NODE_FILE_CHECKHASH"
+            options:
+                node_id: 3
+                folder_id: 1
+                file_id: 1
+          11:
+            action: "NODE_FILE_DELETE"
+            options:
+                node_id: 3
+                folder_id: 1
+                file_id: 1
+          12:
+            action: "NODE_FILE_REPAIR"
+            options:
+                node_id: 3
+                folder_id: 1
+                file_id: 1
+          13:
+            action: "NODE_FILE_RESTORE"
+            options:
+                node_id: 3
+                folder_id: 1
+                file_id: 1
+          14:
+            action: "NODE_FOLDER_SCAN"
+            options:
+                node_id: 3
+                folder_id: 1
+          15:
+            action: "NODE_FOLDER_CHECKHASH"
+            options:
+                node_id: 3
+                folder_id: 1
+          16:
+            action: "NODE_FOLDER_REPAIR"
+            options:
+                node_id: 3
+                folder_id: 1
+          17:
+            action: "NODE_FOLDER_RESTORE"
+            options:
+                node_id: 3
+                folder_id: 1
+          18:
+            action: "NODE_OS_SCAN"
+            options:
+                node_id: 3
+          19:
+            action: "NODE_SHUTDOWN"
+            options:
+                node_id: 6
+          20:
+            action: "NODE_STARTUP"
+            options:
+                node_id: 6
+          21:
+            action: "NODE_RESET"
+            options:
+                node_id: 6
+          22:
+            action: "NETWORK_ACL_ADDRULE"
+            options:
+                position: 1
+                permission: 2
+                source_ip_id: 7
+                dest_ip_id: 1
+                source_port_id: 1
+                dest_port_id: 1
+                protocol_id: 1
+          23:
+            action: "NETWORK_ACL_ADDRULE"
+            options:
+                position: 1
+                permission: 2
+                source_ip_id: 8
+                dest_ip_id: 1
+                source_port_id: 1
+                dest_port_id: 1
+                protocol_id: 1
+          24:
+            action: "NETWORK_ACL_ADDRULE"
+            options:
+                position: 1
+                permission: 2
+                source_ip_id: 7
+                dest_ip_id: 3
+                source_port_id: 1
+                dest_port_id: 1
+                protocol_id: 3
+          25:
+            action: "NETWORK_ACL_ADDRULE"
+            options:
+                position: 1
+                permission: 2
+                source_ip_id: 8
+                dest_ip_id: 3
+                source_port_id: 1
+                dest_port_id: 1
+                protocol_id: 3
+          26:
+            action: "NETWORK_ACL_ADDRULE"
+            options:
+                position: 1
+                permission: 2
+                source_ip_id: 7
+                dest_ip_id: 4
+                source_port_id: 1
+                dest_port_id: 1
+                protocol_id: 3
+          27:
+            action: "NETWORK_ACL_ADDRULE"
+            options:
+                position: 1
+                permission: 2
+                source_ip_id: 8
+                dest_ip_id: 4
+                source_port_id: 1
+                dest_port_id: 1
+                protocol_id: 3
+          28:
+            action: "NETWORK_ACL_REMOVERULE"
+            options:
+                position: 0
+          29:
+            action: "NETWORK_ACL_REMOVERULE"
+            options:
+                position: 1
+          30:
+            action: "NETWORK_ACL_REMOVERULE"
+            options:
+                position: 2
+          31:
+            action: "NETWORK_ACL_REMOVERULE"
+            options:
+                position: 3
+          32:
+            action: "NETWORK_ACL_REMOVERULE"
+            options:
+                position: 4
+          33:
+            action: "NETWORK_ACL_REMOVERULE"
+            options:
+                position: 5
+          34:
+            action: "NETWORK_ACL_REMOVERULE"
+            options:
+                position: 6
+          35:
+            action: "NETWORK_ACL_REMOVERULE"
+            options:
+                position: 7
+          36:
+            action: "NETWORK_ACL_REMOVERULE"
+            options:
+                position: 8
+          37:
+            action: "NETWORK_ACL_REMOVERULE"
+            options:
+                position: 9
+          38:
+            action: "NETWORK_NIC_DISABLE"
+            options:
+                node_id: 1
+                nic_id: 1
+          39:
+            action: "NETWORK_NIC_ENABLE"
+            options:
+                node_id: 1
+                nic_id: 1
+          40:
+            action: "NETWORK_NIC_DISABLE"
+            options:
+                node_id: 2
+                nic_id: 1
+          41:
+            action: "NETWORK_NIC_ENABLE"
+            options:
+                node_id: 2
+                nic_id: 1
+          42:
+            action: "NETWORK_NIC_DISABLE"
+            options:
+                node_id: 3
+                nic_id: 1
+          43:
+            action: "NETWORK_NIC_ENABLE"
+            options:
+                node_id: 3
+                nic_id: 1
+          44:
+            action: "NETWORK_NIC_DISABLE"
+            options:
+                node_id: 4
+                nic_id: 1
+          45:
+            action: "NETWORK_NIC_ENABLE"
+            options:
+                node_id: 4
+                nic_id: 1
+          46:
+            action: "NETWORK_NIC_DISABLE"
+            options:
+                node_id: 5
+                nic_id: 1
+          47:
+            action: "NETWORK_NIC_ENABLE"
+            options:
+                node_id: 5
+                nic_id: 1
+          48:
+            action: "NETWORK_NIC_DISABLE"
+            options:
+                node_id: 5
+                nic_id: 2
+          49:
+            action: "NETWORK_NIC_ENABLE"
+            options:
+                node_id: 5
+                nic_id: 2
+          50:
+            action: "NETWORK_NIC_DISABLE"
+            options:
+                node_id: 6
+                nic_id: 1
+          51:
+            action: "NETWORK_NIC_ENABLE"
+            options:
+                node_id: 6
+                nic_id: 1
+          52:
+            action: "NETWORK_NIC_DISABLE"
+            options:
+                node_id: 7
+                nic_id: 1
+          53:
+            action: "NETWORK_NIC_ENABLE"
+            options:
+                node_id: 7
+                nic_id: 1
+
+
+      options:
+        nodes:  # NOTE(review): action_map node_ids look ordered like the observation nodes, not this list — confirm
+        - node_ref: router_1
+        - node_ref: switch_1
+        - node_ref: switch_2
+        - node_ref: domain_controller
+        - node_ref: web_server
+        - node_ref: database_server
+        - node_ref: backup_server
+        - node_ref: security_suite
+        - node_ref: client_1
+        - node_ref: client_2
+        max_folders_per_node: 2
+        max_files_per_folder: 2
+        max_services_per_node: 2
+        max_nics_per_node: 8  # equals num_ports of switch_1 / switch_2 in `simulation`
+        max_acl_rules: 10  # action_map removes rule positions 0-9
+
+    reward_function:
+      reward_components:
+        - type: DATABASE_FILE_INTEGRITY
+          weight: 0.5
+          options:
+            node_ref: database_server
+            folder_name: database
+            file_name: database.db
+
+
+        - type: WEB_SERVER_404_PENALTY
+          weight: 0.5
+          options:
+            node_ref: web_server
+            service_ref: web_server_web_service
+
+
+    agent_settings:
+      # ...
+  - ref: defender2
+    team: BLUE
+    type: ProxyAgent
+
+    observation_space:
+      type: UC2BlueObservation
+      options:
+        num_services_per_node: 1
+        num_folders_per_node: 1
+        num_files_per_folder: 1
+        num_nics_per_node: 2
+        nodes:
+        - node_ref: domain_controller
+          services:
+          - service_ref: domain_controller_dns_server
+        - node_ref: web_server
+          services:
+          - service_ref: web_server_database_client
+        - node_ref: database_server
+          services:
+          - service_ref: database_service
+          folders:
+          - folder_name: database
+            files:
+            - file_name: database.db
+        - node_ref: backup_server
+          # services:
+          # - service_ref: backup_service
+        - node_ref: security_suite
+        - node_ref: client_1
+        - node_ref: client_2
+        links:
+        - link_ref: router_1___switch_1
+        - link_ref: router_1___switch_2
+        - link_ref: switch_1___domain_controller
+        - link_ref: switch_1___web_server
+        - link_ref: switch_1___database_server
+        - link_ref: switch_1___backup_server
+        - link_ref: switch_1___security_suite
+        - link_ref: switch_2___client_1
+        - link_ref: switch_2___client_2
+        - link_ref: switch_2___security_suite
+        acl:
+          options:
+            max_acl_rules: 10
+          router_node_ref: router_1
+          ip_address_order:
+            - node_ref: domain_controller
+              nic_num: 1
+            - node_ref: web_server
+              nic_num: 1
+            - node_ref: database_server
+              nic_num: 1
+            - node_ref: backup_server
+              nic_num: 1
+            - node_ref: security_suite
+              nic_num: 1
+            - node_ref: client_1
+              nic_num: 1
+            - node_ref: client_2
+              nic_num: 1
+            - node_ref: security_suite
+              nic_num: 2
+        ics: null
+
+    action_space:
+      action_list:
+        - type: DONOTHING
+        - type: NODE_SERVICE_SCAN
+        - type: NODE_SERVICE_STOP
+        - type: NODE_SERVICE_START
+        - type: NODE_SERVICE_PAUSE
+        - type: NODE_SERVICE_RESUME
+        - type: NODE_SERVICE_RESTART
+        - type: NODE_SERVICE_DISABLE
+        - type: NODE_SERVICE_ENABLE
+        - type: NODE_FILE_SCAN
+        - type: NODE_FILE_CHECKHASH
+        - type: NODE_FILE_DELETE
+        - type: NODE_FILE_REPAIR
+        - type: NODE_FILE_RESTORE
+        - type: NODE_FOLDER_SCAN
+        - type: NODE_FOLDER_CHECKHASH
+        - type: NODE_FOLDER_REPAIR
+        - type: NODE_FOLDER_RESTORE
+        - type: NODE_OS_SCAN
+        - type: NODE_SHUTDOWN
+        - type: NODE_STARTUP
+        - type: NODE_RESET
+        - type: NETWORK_ACL_ADDRULE
+          options:
+            target_router_ref: router_1
+        - type: NETWORK_ACL_REMOVERULE
+          options:
+            target_router_ref: router_1
+        - type: NETWORK_NIC_ENABLE
+        - type: NETWORK_NIC_DISABLE
+
+      action_map:
+          0:
+            action: DONOTHING
+            options: {}
+          # scan webapp service
+          1:
+            action: NODE_SERVICE_SCAN
+            options:
+              node_id: 2
+              service_id: 1
+          # stop webapp service
+          2:
+            action: NODE_SERVICE_STOP
+            options:
+              node_id: 2
+              service_id: 1
+          # start webapp service
+          3:
+            action: "NODE_SERVICE_START"
+            options:
+                node_id: 2
+                service_id: 1
+          4:
+            action: "NODE_SERVICE_PAUSE"
+            options:
+                node_id: 2
+                service_id: 1
+          5:
+            action: "NODE_SERVICE_RESUME"
+            options:
+                node_id: 2
+                service_id: 1
+          6:
+            action: "NODE_SERVICE_RESTART"
+            options:
+                node_id: 2
+                service_id: 1
+          7:
+            action: "NODE_SERVICE_DISABLE"
+            options:
+                node_id: 2
+                service_id: 1
+          8:
+            action: "NODE_SERVICE_ENABLE"
+            options:
+                node_id: 2
+                service_id: 1
+          9:
+            action: "NODE_FILE_SCAN"
+            options:
+                node_id: 3
+                folder_id: 1
+                file_id: 1
+          10:
+            action: "NODE_FILE_CHECKHASH"
+            options:
+                node_id: 3
+                folder_id: 1
+                file_id: 1
+          11:
+            action: "NODE_FILE_DELETE"
+            options:
+                node_id: 3
+                folder_id: 1
+                file_id: 1
+          12:
+            action: "NODE_FILE_REPAIR"
+            options:
+                node_id: 3
+                folder_id: 1
+                file_id: 1
+          13:
+            action: "NODE_FILE_RESTORE"
+            options:
+                node_id: 3
+                folder_id: 1
+                file_id: 1
+          14:
+            action: "NODE_FOLDER_SCAN"
+            options:
+                node_id: 3
+                folder_id: 1
+          15:
+            action: "NODE_FOLDER_CHECKHASH"
+            options:
+                node_id: 3
+                folder_id: 1
+          16:
+            action: "NODE_FOLDER_REPAIR"
+            options:
+                node_id: 3
+                folder_id: 1
+          17:
+            action: "NODE_FOLDER_RESTORE"
+            options:
+                node_id: 3
+                folder_id: 1
+          18:
+            action: "NODE_OS_SCAN"
+            options:
+                node_id: 3
+          19:
+            action: "NODE_SHUTDOWN"
+            options:
+                node_id: 6
+          20:
+            action: "NODE_STARTUP"
+            options:
+                node_id: 6
+          21:
+            action: "NODE_RESET"
+            options:
+                node_id: 6
+          22:
+            action: "NETWORK_ACL_ADDRULE"
+            options:
+                position: 1
+                permission: 2
+                source_ip_id: 7
+                dest_ip_id: 1
+                source_port_id: 1
+                dest_port_id: 1
+                protocol_id: 1
+          23:
+            action: "NETWORK_ACL_ADDRULE"
+            options:
+                position: 1
+                permission: 2
+                source_ip_id: 8
+                dest_ip_id: 1
+                source_port_id: 1
+                dest_port_id: 1
+                protocol_id: 1
+          24:
+            action: "NETWORK_ACL_ADDRULE"
+            options:
+                position: 1
+                permission: 2
+                source_ip_id: 7
+                dest_ip_id: 3
+                source_port_id: 1
+                dest_port_id: 1
+                protocol_id: 3
+          25:
+            action: "NETWORK_ACL_ADDRULE"
+            options:
+                position: 1
+                permission: 2
+                source_ip_id: 8
+                dest_ip_id: 3
+                source_port_id: 1
+                dest_port_id: 1
+                protocol_id: 3
+          26:
+            action: "NETWORK_ACL_ADDRULE"
+            options:
+                position: 1
+                permission: 2
+                source_ip_id: 7
+                dest_ip_id: 4
+                source_port_id: 1
+                dest_port_id: 1
+                protocol_id: 3
+          27:
+            action: "NETWORK_ACL_ADDRULE"
+            options:
+                position: 1
+                permission: 2
+                source_ip_id: 8
+                dest_ip_id: 4
+                source_port_id: 1
+                dest_port_id: 1
+                protocol_id: 3
+          28:
+            action: "NETWORK_ACL_REMOVERULE"
+            options:
+                position: 0
+          29:
+            action: "NETWORK_ACL_REMOVERULE"
+            options:
+                position: 1
+          30:
+            action: "NETWORK_ACL_REMOVERULE"
+            options:
+                position: 2
+          31:
+            action: "NETWORK_ACL_REMOVERULE"
+            options:
+                position: 3
+          32:
+            action: "NETWORK_ACL_REMOVERULE"
+            options:
+                position: 4
+          33:
+            action: "NETWORK_ACL_REMOVERULE"
+            options:
+                position: 5
+          34:
+            action: "NETWORK_ACL_REMOVERULE"
+            options:
+                position: 6
+          35:
+            action: "NETWORK_ACL_REMOVERULE"
+            options:
+                position: 7
+          36:
+            action: "NETWORK_ACL_REMOVERULE"
+            options:
+                position: 8
+          37:
+            action: "NETWORK_ACL_REMOVERULE"
+            options:
+                position: 9
+          38:
+            action: "NETWORK_NIC_DISABLE"
+            options:
+                node_id: 1
+                nic_id: 1
+          39:
+            action: "NETWORK_NIC_ENABLE"
+            options:
+                node_id: 1
+                nic_id: 1
+          40:
+            action: "NETWORK_NIC_DISABLE"
+            options:
+                node_id: 2
+                nic_id: 1
+          41:
+            action: "NETWORK_NIC_ENABLE"
+            options:
+                node_id: 2
+                nic_id: 1
+          42:
+            action: "NETWORK_NIC_DISABLE"
+            options:
+                node_id: 3
+                nic_id: 1
+          43:
+            action: "NETWORK_NIC_ENABLE"
+            options:
+                node_id: 3
+                nic_id: 1
+          44:
+            action: "NETWORK_NIC_DISABLE"
+            options:
+                node_id: 4
+                nic_id: 1
+          45:
+            action: "NETWORK_NIC_ENABLE"
+            options:
+                node_id: 4
+                nic_id: 1
+          46:
+            action: "NETWORK_NIC_DISABLE"
+            options:
+                node_id: 5
+                nic_id: 1
+          47:
+            action: "NETWORK_NIC_ENABLE"
+            options:
+                node_id: 5
+                nic_id: 1
+          48:
+            action: "NETWORK_NIC_DISABLE"
+            options:
+                node_id: 5
+                nic_id: 2
+          49:
+            action: "NETWORK_NIC_ENABLE"
+            options:
+                node_id: 5
+                nic_id: 2
+          50:
+            action: "NETWORK_NIC_DISABLE"
+            options:
+                node_id: 6
+                nic_id: 1
+          51:
+            action: "NETWORK_NIC_ENABLE"
+            options:
+                node_id: 6
+                nic_id: 1
+          52:
+            action: "NETWORK_NIC_DISABLE"
+            options:
+                node_id: 7
+                nic_id: 1
+          53:
+            action: "NETWORK_NIC_ENABLE"
+            options:
+                node_id: 7
+                nic_id: 1
+
+
+      options:
+        nodes:  # NOTE(review): action_map node_ids look ordered like the observation nodes, not this list — confirm
+        - node_ref: router_1
+        - node_ref: switch_1
+        - node_ref: switch_2
+        - node_ref: domain_controller
+        - node_ref: web_server
+        - node_ref: database_server
+        - node_ref: backup_server
+        - node_ref: security_suite
+        - node_ref: client_1
+        - node_ref: client_2
+        max_folders_per_node: 2
+        max_files_per_folder: 2
+        max_services_per_node: 2
+        max_nics_per_node: 8  # equals num_ports of switch_1 / switch_2 in `simulation`
+        max_acl_rules: 10  # action_map removes rule positions 0-9
+
+    reward_function:
+      reward_components:
+        - type: DATABASE_FILE_INTEGRITY
+          weight: 0.5
+          options:
+            node_ref: database_server
+            folder_name: database
+            file_name: database.db
+
+
+        - type: WEB_SERVER_404_PENALTY
+          weight: 0.5
+          options:
+            node_ref: web_server
+            service_ref: web_server_web_service
+
+
+    agent_settings:
+      # ...
+
+
+
+
+
+simulation:
+  network:
+    nodes:
+
+    - ref: router_1
+      type: router
+      hostname: router_1
+      num_ports: 5
+      ports:
+        1:  # linked to switch_1 (server subnet 192.168.1.0/24)
+          ip_address: 192.168.1.1
+          subnet_mask: 255.255.255.0
+        2:  # linked to switch_2 (client subnet 192.168.10.0/24); clients use this as default_gateway
+          ip_address: 192.168.10.1
+          subnet_mask: 255.255.255.0
+      acl:
+        0:
+          action: PERMIT
+          src_port: POSTGRES_SERVER
+          dst_port: POSTGRES_SERVER
+        1:
+          action: PERMIT
+          src_port: DNS
+          dst_port: DNS
+        22:
+          action: PERMIT
+          src_port: ARP
+          dst_port: ARP
+        23:
+          action: PERMIT
+          protocol: ICMP
+
+    - ref: switch_1
+      type: switch
+      hostname: switch_1
+      num_ports: 8
+
+    - ref: switch_2
+      type: switch
+      hostname: switch_2
+      num_ports: 8
+
+    - ref: domain_controller
+      type: server
+      hostname: domain_controller
+      ip_address: 192.168.1.10
+      subnet_mask: 255.255.255.0
+      default_gateway: 192.168.1.1
+      services:
+      - ref: domain_controller_dns_server
+        type: DNSServer
+        options:
+          domain_mapping:
+            arcd.com: 192.168.1.12 # web server
+
+    - ref: web_server
+      type: server
+      hostname: web_server
+      ip_address: 192.168.1.12
+      subnet_mask: 255.255.255.0
+      default_gateway: 192.168.1.1  # router_1 port 1, as on the other servers
+      dns_server: 192.168.1.10  # domain_controller
+      services:
+      - ref: web_server_database_client
+        type: DatabaseClient
+        options:
+          db_server_ip: 192.168.1.14  # database_server
+      - ref: web_server_web_service
+        type: WebServer
+
+
+    - ref: database_server
+      type: server
+      hostname: database_server
+      ip_address: 192.168.1.14
+      subnet_mask: 255.255.255.0
+      default_gateway: 192.168.1.1
+      dns_server: 192.168.1.10
+      services:
+      - ref: database_service
+        type: DatabaseService
+
+    - ref: backup_server
+      type: server
+      hostname: backup_server
+      ip_address: 192.168.1.16
+      subnet_mask: 255.255.255.0
+      default_gateway: 192.168.1.1
+      dns_server: 192.168.1.10
+      services:
+      - ref: backup_service
+        type: DatabaseBackup
+
+    - ref: security_suite
+      type: server
+      hostname: security_suite
+      ip_address: 192.168.1.110
+      subnet_mask: 255.255.255.0
+      default_gateway: 192.168.1.1
+      dns_server: 192.168.1.10
+      nics:
+        2: # unfortunately this number is currently meaningless, they're just added in order and take up the next available slot
+          ip_address: 192.168.10.110
+          subnet_mask: 255.255.255.0
+
+    - ref: client_1
+      type: computer
+      hostname: client_1
+      ip_address: 192.168.10.21
+      subnet_mask: 255.255.255.0
+      default_gateway: 192.168.10.1
+      dns_server: 192.168.1.10
+      services:
+      - ref: data_manipulation_bot
+        type: DataManipulationBot
+      - ref: client_1_dns_client
+        type: DNSClient
+
+    - ref: client_2
+      type: computer
+      hostname: client_2
+      ip_address: 192.168.10.22
+      subnet_mask: 255.255.255.0
+      default_gateway: 192.168.10.1
+      dns_server: 192.168.1.10
+      applications:
+      - ref: client_2_web_browser
+        type: WebBrowser
+      services:
+      - ref: client_2_dns_client
+        type: DNSClient
+
+    links:
+    - ref: router_1___switch_1
+      endpoint_a_ref: router_1
+      endpoint_a_port: 1
+      endpoint_b_ref: switch_1
+      endpoint_b_port: 8
+    - ref: router_1___switch_2
+      endpoint_a_ref: router_1
+      endpoint_a_port: 2
+      endpoint_b_ref: switch_2
+      endpoint_b_port: 8
+    - ref: switch_1___domain_controller
+      endpoint_a_ref: switch_1
+      endpoint_a_port: 1
+      endpoint_b_ref: domain_controller
+      endpoint_b_port: 1
+    - ref: switch_1___web_server
+      endpoint_a_ref: switch_1
+      endpoint_a_port: 2
+      endpoint_b_ref: web_server
+      endpoint_b_port: 1
+    - ref: switch_1___database_server
+      endpoint_a_ref: switch_1
+      endpoint_a_port: 3
+      endpoint_b_ref: database_server
+      endpoint_b_port: 1
+    - ref: switch_1___backup_server
+      endpoint_a_ref: switch_1
+      endpoint_a_port: 4
+      endpoint_b_ref: backup_server
+      endpoint_b_port: 1
+    - ref: switch_1___security_suite
+      endpoint_a_ref: switch_1
+      endpoint_a_port: 7
+      endpoint_b_ref: security_suite
+      endpoint_b_port: 1
+    - ref: switch_2___client_1
+      endpoint_a_ref: switch_2
+      endpoint_a_port: 1
+      endpoint_b_ref: client_1
+      endpoint_b_port: 1
+    - ref: switch_2___client_2
+      endpoint_a_ref: switch_2
+      endpoint_a_port: 2
+      endpoint_b_ref: client_2
+      endpoint_b_port: 1
+    - ref: switch_2___security_suite
+      endpoint_a_ref: switch_2
+      endpoint_a_port: 7
+      endpoint_b_ref: security_suite
+      endpoint_b_port: 2
diff --git a/src/primaite/game/environment.py b/src/primaite/game/environment.py
index 8ddcb88a..db24db60 100644
--- a/src/primaite/game/environment.py
+++ b/src/primaite/game/environment.py
@@ -1,7 +1,8 @@
-from typing import Any, Dict, Optional, SupportsFloat, Tuple
+from typing import Any, Dict, Final, Optional, SupportsFloat, Tuple
 
 import gymnasium
 from gymnasium.core import ActType, ObsType
+from ray.rllib.env.multi_agent_env import MultiAgentEnv
 
 from primaite.game.agent.interface import ProxyAgent
 from primaite.game.game import PrimaiteGame
@@ -86,3 +87,93 @@ class PrimaiteRayEnv(gymnasium.Env):
     def step(self, action: ActType) -> Tuple[ObsType, SupportsFloat, bool, bool, Dict]:
         """Perform a step in the environment."""
         return self.env.step(action)
+
+
+class PrimaiteRayMARLEnv(MultiAgentEnv):
+    """Ray Environment that inherits from MultiAgentEnv to allow training MARL systems.
+
+    Per-agent dictionaries produced by this class (spaces, observations, rewards, flags) are keyed by the
+    ``agent_name`` of each agent in ``game.rl_agents``.
+    """
+
+    def __init__(self, env_config: Optional[Dict] = None) -> None:
+        """Initialise the environment.
+
+        :param env_config: A dictionary containing the environment configuration. It must contain a single key, `game`
+            which is the PrimaiteGame instance.
+        :type env_config: Dict[str, PrimaiteGame]
+        :raises TypeError: If ``env_config`` is omitted or ``None``.
+        """
+        # The signature allows None, but a game is mandatory: fail with a clear message instead of the opaque
+        # "'NoneType' object is not subscriptable" raised by indexing None.
+        if env_config is None:
+            raise TypeError("PrimaiteRayMARLEnv requires an env_config dictionary containing a 'game' entry.")
+        # Reference to the wrapped PrimAITE game.
+        self.game: PrimaiteGame = env_config["game"]
+        # All RL agents of the game, keyed by agent name. This mapping should not change!
+        self.agents: Final[Dict[str, ProxyAgent]] = {agent.agent_name: agent for agent in self.game.rl_agents}
+        self._agent_ids = list(self.agents.keys())
+
+        self.terminateds = set()
+        self.truncateds = set()
+        # NOTE(review): spaces and agent ids are assigned before super().__init__(); presumably the base class reads
+        # them during initialisation, so keep this ordering unless confirmed otherwise.
+        self.observation_space = gymnasium.spaces.Dict(
+            {name: agent.observation_manager.space for name, agent in self.agents.items()}
+        )
+        self.action_space = gymnasium.spaces.Dict(
+            {name: agent.action_manager.space for name, agent in self.agents.items()}
+        )
+        super().__init__()
+
+    def reset(self, *, seed: Optional[int] = None, options: Optional[dict] = None) -> Tuple[ObsType, Dict]:
+        """Reset the game and return the initial observations.
+
+        :param seed: Accepted for API compatibility; currently unused.
+        :param options: Accepted for API compatibility; currently unused.
+        :return: Observations keyed by agent name, and an empty info dictionary.
+        """
+        self.game.reset()
+        state = self.game.get_sim_state()
+        self.game.update_agents(state)
+        return self._get_obs(), {}
+
+    def step(
+        self, actions: Dict[str, ActType]
+    ) -> Tuple[Dict[str, ObsType], Dict[str, SupportsFloat], Dict[str, bool], Dict[str, bool], Dict]:
+        """Perform a step in the environment. Adherent to Ray MultiAgentEnv step API.
+
+        :param actions: Dict of actions. The key is agent identifier and the value is a gymnasium action instance.
+        :type actions: Dict[str, ActType]
+        :return: Observations, rewards, terminateds, truncateds, and info. Each one is a dictionary keyed by agent
+            identifier; terminateds and truncateds also carry an ``__all__`` entry and info is always empty.
+        :rtype: Tuple[Dict[str,ObsType], Dict[str, SupportsFloat], Dict[str,bool], Dict[str,bool], Dict]
+        """
+        # 1. Perform actions
+        for agent_name, action in actions.items():
+            self.agents[agent_name].store_action(action)
+        self.game.apply_agent_actions()
+
+        # 2. Advance timestep
+        self.game.advance_timestep()
+
+        # 3. Get next observations
+        state = self.game.get_sim_state()
+        self.game.update_agents(state)
+        next_obs = self._get_obs()
+
+        # 4. Get rewards and episode-end flags
+        rewards = {name: agent.reward_function.current_reward for name, agent in self.agents.items()}
+        terminateds = {name: False for name in self.agents}
+        # Evaluate truncation once so every agent and "__all__" report the same value.
+        truncated = self.game.calculate_truncated()
+        truncateds = {name: truncated for name in self.agents}
+        infos = {}
+        # self.terminateds is never added to in this class, so this is True only when there are no agents.
+        terminateds["__all__"] = len(self.terminateds) == len(self.agents)
+        truncateds["__all__"] = truncated
+        return next_obs, rewards, terminateds, truncateds, infos
+
+    def _get_obs(self) -> Dict[str, ObsType]:
+        """Return the current observation of every agent, keyed by agent name."""
+        return {name: agent.observation_manager.current_observation for name, agent in self.agents.items()}
diff --git a/src/primaite/notebooks/training_example_ray_multi_agent.ipynb b/src/primaite/notebooks/training_example_ray_multi_agent.ipynb
new file mode 100644
index 00000000..9f916af9
--- /dev/null
+++ b/src/primaite/notebooks/training_example_ray_multi_agent.ipynb
@@ -0,0 +1,127 @@
+{
+ "cells": [
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "from primaite.game.game import PrimaiteGame\n",
+    "import yaml\n",
+    "from primaite.config.load import example_config_path\n",
+    "\n",
+    "from primaite.game.environment import PrimaiteRayEnv"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "with open(example_config_path(), 'r') as f:\n",
+    "    cfg = yaml.safe_load(f)\n",
+    "\n",
+    "game = PrimaiteGame.from_config(cfg)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# gym = PrimaiteRayEnv({\"game\":game})"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "import ray\n",
+    "from ray import air, tune\n",
+    "from ray.rllib.algorithms.ppo import PPOConfig"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "ray.shutdown()\n",
+    "ray.init()"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "from primaite.game.environment import PrimaiteRayMARLEnv\n",
+    "\n",
+    "# One policy per RL agent: each agent id is mapped to the policy of the same name.\n",
+    "env_config = {\"game\": game}\n",
+    "config = (\n",
+    "    PPOConfig()\n",
+    "    .environment(env=PrimaiteRayMARLEnv, env_config=env_config)\n",
+    "    .rollouts(num_rollout_workers=0)\n",
+    "    .multi_agent(\n",
+    "        policies={agent.agent_name for agent in game.rl_agents},\n",
+    "        policy_mapping_fn=lambda agent_id, episode, worker, **kw: agent_id,\n",
+    "        )\n",
+    "    .training(train_batch_size=128)\n",
+    "    )\n"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "tune.Tuner(\n",
+    "    \"PPO\",\n",
+    "    run_config=air.RunConfig(\n",
+    "        stop={\"training_iteration\": 128},\n",
+    "        checkpoint_config=air.CheckpointConfig(\n",
+    "            checkpoint_frequency=10,\n",
+    "        ),\n",
+    "    ),\n",
+    "    param_space=config\n",
+    ").fit()"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": []
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "venv",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.10.12"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 2
+}