added aquarium and mas emergence

2024-11-10 10:58:59 +01:00 · 2024-11-10 10:58:59 +01:00 · b35f19a925
commit b35f19a925
parent 64ba429c49
14 changed files with 73 additions and 15 deletions
--- a/_bibliography.bib
+++ b/_bibliography.bib
@ -213,3 +213,19 @@ organization={Conference on Artificial Life - Alife 2023},
  journal={arXiv preprint arXiv:2301.07420},
  year={2023}
 }
+
+@inproceedings{altmann2024emergence,
+  title={Emergence in Multi-agent Systems: A Safety Perspective},
+  author={Altmann, Philipp and Schönberger, Julian and Illium, Steffen and Zorn, Maximilian and Ritz, Fabian and Haider, Tom and Burton, Simon and Gabor, Thomas},
+  booktitle={International Symposium on Leveraging Applications of Formal Methods},
+  pages={104--120},
+  year={2024},
+  organization={Springer Nature Switzerland Cham}
+}
+
+@article{kolle2024aquarium,
+  title={Aquarium: A Comprehensive Framework for Exploring Predator-Prey Dynamics through Multi-Agent Reinforcement Learning Algorithms},
+  author={Kölle, Michael and Erpelding, Yannick and Ritz, Fabian and Phan, Thomy and Illium, Steffen and Linnhoff-Popien, Claudia},
+  journal={arXiv preprint arXiv:2401.07056},
+  year={2024}
+}
--- a/_config.yml
+++ b/_config.yml
@ -21,7 +21,7 @@ locale                   : "en-US"
 title                    : "Steffen Illium"
 title_separator          : "---"
 subtitle                 : " " # site tagline that appears below site title in masthead
-name                     : Steffen Illium
+name                     : Dr. Steffen Illium
 description              : "Personal Website"
 url                      : "https://steffenillium.de" # the base hostname & protocol for your site e.g. "https://mmistakes.github.io"
 baseurl                  : "" # the subpath of your site, e.g. "/blog"
@ -57,9 +57,9 @@ social:

 # Site Author
 author:
-  name             : "Steffen Illium"
+  name             : "Dr. Steffen Illium"
  avatar           : "/assets/images/newshot_2.jpg" # path of avatar image, e.g. "/assets/images/bio-photo.jpg"
-  bio              : "[AI Researcher](/research/) and [Lecturer](/teaching/), [PHD Student](https://www.mobile.ifi.lmu.de/team/steffen-illium/) @ [LMU Munich](https://www.lmu.de/en/index.html)"
+  bio              : "Senior AI Consultant @ [XITASO](https://xitaso.com), [AI Researcher](/research/), [PhD](https://www.mobile.ifi.lmu.de/team/steffen-illium/) from [LMU Munich](https://www.lmu.de/en/index.html)"
  location         : "Augsburg"
  links:
    - label: "LMU-Munich"
--- a/_posts/research/2024-01-13-aquarium.md
+++ b/_posts/research/2024-01-13-aquarium.md
@ -0,0 +1,18 @@
+---
+layout: single
+title:  "Aquarium"
+categories: research MARL reinforcement-learning multi-agent
+excerpt: "Exploring Predator-Prey Dynamics"
+header:
+  teaser: assets/figures/20_aquarium.png
+---
+
+![Multi-Agent Reinforcement Learning Cycle](/assets/figures/20_aquarium.png){:style="display:block; width:40%" .align-right}
+Recent advances in multi-agent reinforcement learning have enabled the modeling of complex interactions between agents in simulated environments. In particular, predator-prey dynamics have garnered significant interest, and various simulations have been adapted to meet unique requirements. To avoid further time-intensive development efforts, we introduce *Aquarium*, a versatile multi-agent reinforcement learning environment designed for studying predator-prey interactions and emergent behavior. *Aquarium* is open-source and seamlessly integrates with the PettingZoo framework, allowing for a quick start using established algorithm implementations. It features physics-based agent movement on a two-dimensional, edge-wrapping plane. Both the agent-environment interactions (observations, actions, rewards) and environmental parameters (agent speed, prey reproduction, predator starvation, and more) are fully customizable. In addition to providing a resource-efficient visualization, *Aquarium* supports video recording, facilitating a visual understanding of agent behavior. 
+
+To showcase the environment's capabilities, we conducted preliminary studies using proximal policy optimization (PPO) to train multiple prey agents to evade a predator. Consistent with existing literature, we found that individual learning leads to worse performance, while parameter sharing significantly improves coordination and sample efficiency.
+{% cite kolle2024aquarium %}
+
+![Construction of the Observation Vector](/assets/figures/20_observation_vector.png){:style="display:block; width:70%" .align-center}
+
+![Average captures and rewards per prey agent](/assets/figures/20_capture_statistics.png){:style="display:block; width:70%" .align-center}
--- a/_posts/research/2024-10-27-emergence-mas.md
+++ b/_posts/research/2024-10-27-emergence-mas.md
@ -0,0 +1,18 @@
+---
+layout: single
+title:  "MAS Emergence"
+categories: research multi-agent reinforcement-learning safety emergence 
+excerpt: "A Safety Perspective"
+header:
+  teaser: assets/figures/21_coins_teaser.png
+---
+
+![Evaluation Environments](/assets/figures/21_envs.png){:style="display:block; width:40%" .align-right}
+Emergent effects can occur in multi-agent systems (MAS), where decision-making is decentralized and based on local information. These effects may range from minor deviations in behavior to catastrophic system failures. To formally define these phenomena, we identify misalignments between the global inherent specification (the true specification) and its local approximation (e.g., the configuration of distinct reward components or observations). Leveraging established safety concepts, we develop a framework for understanding these emergent effects. To demonstrate the resulting implications, we examine two highly configurable gridworld scenarios, where inadequate specifications lead to unintended behavior deviations when derived independently. Acknowledging that a global solution may not always be practical, we propose adjusting the underlying parameterizations to mitigate these issues, thereby improving system alignment and reducing the risk of emergent failures.
+{% cite altmann2024emergence %}
+
+![Instances of emergent behavior](/assets/figures/21_coins.png){:style="display:block; width:70%" .align-center}
+
+![Blocking behavior](/assets/figures/21_blocking.png){:style="display:block; width:70%" .align-center}
+
+
--- a/assets/figures/20_aquarium.png
+++ b/assets/figures/20_aquarium.png
--- a/assets/figures/20_capture_statistics.png
+++ b/assets/figures/20_capture_statistics.png
--- a/assets/figures/20_observation_vector.png
+++ b/assets/figures/20_observation_vector.png
--- a/assets/figures/21_blocking.png
+++ b/assets/figures/21_blocking.png
--- a/assets/figures/21_coins.png
+++ b/assets/figures/21_coins.png
--- a/assets/figures/21_coins_teaser.png
+++ b/assets/figures/21_coins_teaser.png
--- a/assets/figures/21_envs.png
+++ b/assets/figures/21_envs.png
--- a/assets/publications/altmann2024emergence.pdf
+++ b/assets/publications/altmann2024emergence.pdf
--- a/assets/publications/kolle2024aquarium.pdf
+++ b/assets/publications/kolle2024aquarium.pdf
--- a/nginx_default.conf
+++ b/nginx_default.conf
@ -8,8 +8,15 @@ server {
    listen  [::]:80;
    server_name  localhost;

-    location ~* \.(?:jpg|jpeg|png|webp)$ {
+    location ~* ^/.+\.(jpg|jpeg|png|gif)$ {
        root   /usr/share/nginx/html;
+        # BEGIN Browser caching for image requests (try_files below tries $uri$webp_suffix first)
+        expires 180d; 
+        add_header Pragma "public";
+        add_header Cache-Control "public";
+        # END Browser caching for image requests
+
+        add_header Vary Accept;
        try_files $uri$webp_suffix $uri =404;
    }

@ -22,13 +29,12 @@ server {
    location = /404.html {
        root   /usr/share/nginx/html;
    }
-
-    # Caching headers
-    # location ~* \.(?:ico|css|js|gif|jpe?g|png)$ {
-    #     expires 30d;
-    #     add_header Pragma public;
-    #     add_header Cache-Control "public";
-    # }
+    # Browser Caching
+    location ~* \.(css|js|ico|gif|jpeg|jpg|webp|png|svg|eot|otf|woff|woff2|ttf|ogg)$ {
+        expires 180d; 
+        add_header Pragma "public";
+        add_header Cache-Control "public";
+    }

  gzip on;
  gzip_comp_level 4;