Publications

For news about publications, follow us on X:

Click on any author names or tags to filter publications.

All topic tags:
survey deep-rl multi-agent-rl agent-modelling ad-hoc-teamwork autonomous-driving goal-recognition explainable-ai causal generalisation security emergent-communication iterated-learning intrinsic-reward simulator state-estimation deep-learning transfer-learning LLM

Selected tags (click to remove):
multi-agent-rl

2025

Charlie Masters, Advaith Vellanki, Jiangbo Shangguan, Bart Kultys, Alastair Moore, Stefano V. Albrecht
Orchestrating Human-AI Teams: The Manager Agent as a Unifying Research Challenge
International Conference on Distributed Artificial Intelligence, 2025
Abstract | BibTex | arXiv | Code
DAI multi-agent-rl LLM

@inproceedings{manager_agent_gym_2025,
   title     = {Orchestrating {Human-AI} Teams: The Manager Agent as a Unifying Research Challenge},
   author    = {Masters, Charlie and Vellanki, Advaith and Shangguan, Jiangbo and Kultys, Bart and Moore, Alastair and Albrecht, Stefano V.},
   booktitle = {Proceedings of the International Conference on Distributed Artificial Intelligence (DAI 2025)},
   year      = {2025}
}

Kale-ab Tessera, Arrasy Rahman, Amos Storkey, Stefano V. Albrecht
HyperMARL: Adaptive Hypernetworks for Multi-Agent RL
Conference on Neural Information Processing Systems, 2025
Abstract | BibTex | arXiv | Code
NeurIPS multi-agent-rl

@inproceedings{tessera2025hypermarl,
   title     = {{HyperMARL}: Adaptive Hypernetworks for Multi-Agent {RL}},
   author    = {Kale-ab Tessera and Arrasy Rahman and Amos Storkey and Stefano V. Albrecht},
   booktitle = {Conference on Neural Information Processing Systems},
   year      = {2025}
}

Lukas Schäfer, Oliver Slumbers, Stephen McAleer, Yali Du, Stefano V. Albrecht, David Mguni
Ensemble Value Functions for Efficient Exploration in Multi-Agent Reinforcement Learning
International Conference on Autonomous Agents and Multiagent Systems, 2025
Abstract | BibTex | arXiv
AAMAS multi-agent-rl

@inproceedings{schafer2025emax,
   title     = {Ensemble Value Functions for Efficient Exploration in Multi-Agent Reinforcement Learning},
   author    = {Lukas Sch{\"a}fer and Oliver Slumbers and Stephen McAleer and Yali Du and Stefano V. Albrecht and David Mguni},
   booktitle = {International Conference on Autonomous Agents and Multiagent Systems},
   year      = {2025}
}

Leonard Hinckeldey, Elliot Fosong, Elle Miller, Rimvydas Rubavicius, Trevor McInroe, Patricia Wollstadt, Christiane B. Wiebel-Herboth, Subramanian Ramamoorthy, Stefano V. Albrecht
Assistax: A Hardware-Accelerated Reinforcement Learning Benchmark for Assistive Robotics
RLC 2025 Workshop on Coordination and Cooperation in Multi-Agent Reinforcement Learning, 2025
Abstract | BibTex | arXiv | Code
RLC multi-agent-rl

@inproceedings{hinck2025assistax,
   author    = {Leonard Hinckeldey and Elliot Fosong and Elle Miller and Rimvydas Rubavicius and Trevor McInroe and Patricia Wollstadt and Christiane B. Wiebel-Herboth and Subramanian Ramamoorthy and Stefano V. Albrecht},
   title     = {{Assistax}: A Hardware-Accelerated Reinforcement Learning Benchmark for Assistive Robotics},
   booktitle = {RLC 2025 Workshop on Coordination and Cooperation in Multi-Agent Reinforcement Learning},
   year      = {2025}
}

2024

Stefano V. Albrecht, Filippos Christianos, Lukas Schäfer
Multi-Agent Reinforcement Learning: Foundations and Modern Approaches
MIT Press (print version scheduled for December 2024), 2024
Abstract | BibTex | Book website | Book codebase
MITP multi-agent-rl deep-rl deep-learning survey

@book{marl-book,
   author    = {Stefano V. Albrecht and Filippos Christianos and Lukas Sch{\"a}fer},
   title     = {Multi-Agent Reinforcement Learning: Foundations and Modern Approaches},
   publisher = {MIT Press},
   year      = {2024},
   url       = {https://www.marl-book.com}
}

Aditya Kapoor, Sushant Swamy, Kale-ab Tessera, Mayank Baranwal, Mingfei Sun, Harshad Khadilkar, Stefano V. Albrecht
Agent-Temporal Credit Assignment for Optimal Policy Preservation in Sparse Multi-Agent Reinforcement Learning
RLC Workshop on Coordination and Cooperation for Multi-Agent Reinforcement Learning Methods, 2024
Abstract | BibTex | Paper
RLC deep-rl multi-agent-rl

@inproceedings{kapoor2024agenttemporal,
   title     = {Agent-Temporal Credit Assignment for Optimal Policy Preservation in Sparse Multi-Agent Reinforcement Learning},
   author    = {Aditya Kapoor and Sushant Swamy and Kale-ab Tessera and Mayank Baranwal and Mingfei Sun and Harshad Khadilkar and Stefano V. Albrecht},
   booktitle = {Coordination and Cooperation for Multi-Agent Reinforcement Learning Methods Workshop},
   year      = {2024},
   url       = {https://openreview.net/forum?id=dGS1e3FXUH}
}

Elliot Fosong, Arrasy Rahman, Ignacio Carlucho, Stefano V. Albrecht
Learning Complex Teamwork Tasks Using a Given Sub-task Decomposition
International Conference on Autonomous Agents and Multiagent Systems, 2024
Abstract | BibTex | arXiv | Code
AAMAS multi-agent-rl

@inproceedings{fosongLearningComplexTeamwork2024,
   author    = {Fosong, Elliot and Rahman, Arrasy and Carlucho, Ignacio and Albrecht, Stefano V.},
   title     = {Learning Complex Teamwork Tasks Using a Given Sub-task Decomposition},
   booktitle = {Proceedings of the 23rd International Conference on Autonomous Agents and Multiagent Systems},
   year      = {2024}
}

Aleksandar Krnjaic, Raul D. Steleac, Jonathan D. Thomas, Georgios Papoudakis, Lukas Schäfer, Andrew Wing Keung To, Kuan-Ho Lao, Murat Cubuktepe, Matthew Haley, Peter Börsting, Stefano V. Albrecht
Scalable Multi-Agent Reinforcement Learning for Warehouse Logistics with Robotic and Human Co-Workers
IEEE/RSJ International Conference on Intelligent Robots and Systems, 2024
Abstract | BibTex | arXiv | Website
IROS multi-agent-rl simulator

@inproceedings{krnjaic2024scalable,
   title     = {Scalable Multi-Agent Reinforcement Learning for Warehouse Logistics with Robotic and Human Co-Workers},
   author    = {Aleksandar Krnjaic and Raul D. Steleac and Jonathan D. Thomas and Georgios Papoudakis and Lukas Sch{\"a}fer and Andrew Wing Keung To and Kuan-Ho Lao and Murat Cubuktepe and Matthew Haley and Peter B{\"o}rsting and Stefano V. Albrecht},
   booktitle = {IEEE/RSJ International Conference on Intelligent Robots and Systems},
   year      = {2024}
}

Sarah Keren, Chaimaa Essayeh, Stefano V. Albrecht, Thomas Morstyn
Multi-Agent Reinforcement Learning for Energy Networks: Computational Challenges, Progress and Open Problems
arXiv:2404.15583, 2024
Abstract | BibTex | arXiv
multi-agent-rl survey

@misc{keren2024multiagent,
   title         = {Multi-Agent Reinforcement Learning for Energy Networks: Computational Challenges, Progress and Open Problems},
   author        = {Sarah Keren and Chaimaa Essayeh and Stefano V. Albrecht and Thomas Morstyn},
   year          = {2024},
   eprint        = {2404.15583},
   archivePrefix = {arXiv},
   primaryClass  = {cs.AI}
}

Kale-ab Tessera, Arrasy Rahman, Stefano V. Albrecht
HyperMARL: Adaptive Hypernetworks for Multi-Agent RL
arXiv:2412.04233, 2024
Abstract | BibTex | arXiv
multi-agent-rl

@misc{tessera2024hyper,
   title         = {{HyperMARL}: Adaptive Hypernetworks for Multi-Agent {RL}},
   author        = {Kale-ab Tessera and Arrasy Rahman and Stefano V. Albrecht},
   year          = {2024},
   eprint        = {2412.04233},
   archivePrefix = {arXiv}
}

2023

Arrasy Rahman, Ignacio Carlucho, Niklas Höpner, Stefano V. Albrecht
A General Learning Framework for Open Ad Hoc Teamwork Using Graph-based Policy Learning
Journal of Machine Learning Research, 2023
Abstract | BibTex | arXiv | Publisher | Code
JMLR ad-hoc-teamwork deep-rl agent-modelling multi-agent-rl

@article{JRahman2022POGPL,
   author  = {Arrasy Rahman and Ignacio Carlucho and Niklas H{\"o}pner and Stefano V. Albrecht},
   title   = {A General Learning Framework for Open Ad Hoc Teamwork Using Graph-based Policy Learning},
   journal = {Journal of Machine Learning Research},
   year    = {2023},
   volume  = {24},
   number  = {298},
   pages   = {1--74},
   url     = {http://jmlr.org/papers/v24/22-099.html}
}

Filippos Christianos, Georgios Papoudakis, Stefano V. Albrecht
Pareto Actor-Critic for Equilibrium Selection in Multi-Agent Reinforcement Learning
Transactions on Machine Learning Research, 2023
Abstract | BibTex | arXiv | Code
TMLR deep-rl multi-agent-rl

@article{christianos2023pareto,
   author  = {Filippos Christianos and Georgios Papoudakis and Stefano V. Albrecht},
   title   = {Pareto Actor-Critic for Equilibrium Selection in Multi-Agent Reinforcement Learning},
   journal = {Transactions on Machine Learning Research (TMLR)},
   year    = {2023}
}

Arrasy Rahman, Elliot Fosong, Ignacio Carlucho, Stefano V. Albrecht
Generating Teammates for Training Robust Ad Hoc Teamwork Agents via Best-Response Diversity
Transactions on Machine Learning Research, 2023
Abstract | BibTex | arXiv | Code
TMLR ad-hoc-teamwork multi-agent-rl deep-rl

@article{rahman2023BRDiv,
   author  = {Arrasy Rahman and Elliot Fosong and Ignacio Carlucho and Stefano V. Albrecht},
   title   = {Generating Teammates for Training Robust Ad Hoc Teamwork Agents via Best-Response Diversity},
   journal = {Transactions on Machine Learning Research (TMLR)},
   year    = {2023}
}

Lukas Schäfer, Filippos Christianos, Amos Storkey, Stefano V. Albrecht
Learning Task Embeddings for Teamwork Adaptation in Multi-Agent Reinforcement Learning
NeurIPS Workshop on Generalization in Planning, 2023
Abstract | BibTex | arXiv | Code
NeurIPS multi-agent-rl deep-rl

@inproceedings{schaefer2023mate,
   title     = {Learning Task Embeddings for Teamwork Adaptation in Multi-Agent Reinforcement Learning},
   author    = {Lukas Sch{\"a}fer and Filippos Christianos and Amos Storkey and Stefano V. Albrecht},
   booktitle = {NeurIPS Workshop on Generalization in Planning},
   year      = {2023}
}

Filippos Christianos, Georgios Papoudakis, Stefano V. Albrecht
Pareto Actor-Critic for Equilibrium Selection in Multi-Agent Reinforcement Learning
AAMAS Workshop on Optimization and Learning in Multiagent Systems, 2023
Abstract | BibTex | arXiv
AAMAS deep-rl multi-agent-rl

@inproceedings{christianos2023paretoworkshop,
   title     = {Pareto Actor-Critic for Equilibrium Selection in Multi-Agent Reinforcement Learning},
   author    = {Filippos Christianos and Georgios Papoudakis and Stefano V. Albrecht},
   booktitle = {AAMAS Workshop on Optimization and Learning in Multiagent Systems},
   year      = {2023}
}

Elliot Fosong, Arrasy Rahman, Ignacio Carlucho, Stefano V. Albrecht
Learning Complex Teamwork Tasks Using a Sub-task Curriculum
AAMAS Workshop on Multiagent Sequential Decision Making Under Uncertainty, 2023
Abstract | BibTex | arXiv | Code
AAMAS multi-agent-rl ad-hoc-teamwork transfer-learning

@inproceedings{fosong2023learning,
   title     = {Learning Complex Teamwork Tasks Using a Sub-task Curriculum},
   author    = {Elliot Fosong and Arrasy Rahman and Ignacio Carlucho and Stefano V. Albrecht},
   booktitle = {AAMAS Workshop on Multiagent Sequential Decision Making under Uncertainty},
   year      = {2023}
}

Adam Michalski, Filippos Christianos, Stefano V. Albrecht
SMAClite: A Lightweight Environment for Multi-Agent Reinforcement Learning
AAMAS Workshop on Multiagent Sequential Decision Making Under Uncertainty, 2023
Abstract | BibTex | arXiv | Code
AAMAS deep-rl multi-agent-rl

@inproceedings{michalski2023smaclite,
   title     = {{SMAClite}: A Lightweight Environment for Multi-Agent Reinforcement Learning},
   author    = {Adam Michalski and Filippos Christianos and Stefano V. Albrecht},
   booktitle = {AAMAS Workshop on Multiagent Sequential Decision Making Under Uncertainty (MSDM)},
   year      = {2023}
}

Lukas Schäfer, Oliver Slumbers, Stephen McAleer, Yali Du, Stefano V. Albrecht, David Mguni
Ensemble Value Functions for Efficient Exploration in Multi-Agent Reinforcement Learning
AAMAS Workshop on Adaptive and Learning Agents, 2023
Abstract | BibTex | arXiv
AAMAS multi-agent-rl deep-rl

@inproceedings{schaefer2023emax,
   title     = {Ensemble Value Functions for Efficient Exploration in Multi-Agent Reinforcement Learning},
   author    = {Lukas Sch{\"a}fer and Oliver Slumbers and Stephen McAleer and Yali Du and Stefano V. Albrecht and David Mguni},
   booktitle = {AAMAS Workshop on Adaptive and Learning Agents (ALA)},
   year      = {2023}
}

Callum Tilbury, Filippos Christianos, Stefano V. Albrecht
Revisiting the Gumbel-Softmax in MADDPG
AAMAS Workshop on Adaptive and Learning Agents, 2023
Abstract | BibTex | arXiv | Code
AAMAS multi-agent-rl deep-rl

@inproceedings{tilbury2023revisitingmaddpg,
   title     = {Revisiting the {Gumbel-Softmax} in {MADDPG}},
   author    = {Callum Tilbury and Filippos Christianos and Stefano V. Albrecht},
   booktitle = {AAMAS Workshop on Adaptive and Learning Agents (ALA)},
   year      = {2023}
}

Aleksandar Krnjaic, Raul D. Steleac, Jonathan D. Thomas, Georgios Papoudakis, Lukas Schäfer, Andrew Wing Keung To, Kuan-Ho Lao, Murat Cubuktepe, Matthew Haley, Peter Börsting, Stefano V. Albrecht
Scalable Multi-Agent Reinforcement Learning for Warehouse Logistics with Robotic and Human Co-Workers
arXiv:2212.11498, 2023
Abstract | BibTex | arXiv | Website
multi-agent-rl simulator

@misc{krnjaic2023scalable,
   title         = {Scalable Multi-Agent Reinforcement Learning for Warehouse Logistics with Robotic and Human Co-Workers},
   author        = {Aleksandar Krnjaic and Raul D. Steleac and Jonathan D. Thomas and Georgios Papoudakis and Lukas Sch{\"a}fer and Andrew Wing Keung To and Kuan-Ho Lao and Murat Cubuktepe and Matthew Haley and Peter B{\"o}rsting and Stefano V. Albrecht},
   year          = {2023},
   eprint        = {2212.11498},
   archivePrefix = {arXiv},
   primaryClass  = {cs.LG}
}

2022

Stefano V. Albrecht, Michael Wooldridge
Special Issue on Multi-Agent Systems Research in the United Kingdom: Guest Editorial
AI Communications, 2022
Abstract | BibTex | Publisher | Special Issue
AIC survey deep-rl multi-agent-rl agent-modelling

@article{albrecht2020special,
   title     = {Special Issue on Multi-Agent Systems Research in the {United Kingdom}: Guest Editorial},
   author    = {Stefano V. Albrecht and Michael Wooldridge},
   journal   = {AI Communications},
   volume    = {35},
   number    = {4},
   year      = {2022},
   publisher = {IOS Press},
   url       = {https://content.iospress.com/articles/ai-communications/aic229003}
}

Ibrahim H. Ahmed, Cillian Brewitt, Ignacio Carlucho, Filippos Christianos, Mhairi Dunion, Elliot Fosong, Samuel Garcin, Shangmin Guo, Balint Gyevnar, Trevor McInroe, Georgios Papoudakis, Arrasy Rahman, Lukas Schäfer, Massimiliano Tamborski, Giuseppe Vecchio, Cheng Wang, Stefano V. Albrecht
Deep Reinforcement Learning for Multi-Agent Interaction
AI Communications, 2022
Abstract | BibTex | arXiv | Publisher
AIC survey deep-rl multi-agent-rl ad-hoc-teamwork agent-modelling goal-recognition security explainable-ai autonomous-driving

@article{albrecht2022aic,
   author  = {Ahmed, Ibrahim H. and Brewitt, Cillian and Carlucho, Ignacio and Christianos, Filippos and Dunion, Mhairi and Fosong, Elliot and Garcin, Samuel and Guo, Shangmin and Gyevnar, Balint and McInroe, Trevor and Papoudakis, Georgios and Rahman, Arrasy and Sch{\"a}fer, Lukas and Tamborski, Massimiliano and Vecchio, Giuseppe and Wang, Cheng and Albrecht, Stefano V.},
   title   = {Deep Reinforcement Learning for Multi-Agent Interaction},
   journal = {AI Communications, Special Issue on Multi-Agent Systems Research in the UK},
   year    = {2022}
}

Shangmin Guo, Yi Ren, Kory Mathewson, Simon Kirby, Stefano V. Albrecht, Kenny Smith
Expressivity of Emergent Languages is a Trade-off between Contextual Complexity and Unpredictability
International Conference on Learning Representations, 2022
Abstract | BibTex | arXiv | Code
ICLR multi-agent-rl emergent-communication

@inproceedings{guo2022expressivity,
   author    = {Shangmin Guo and Yi Ren and Kory Mathewson and Simon Kirby and Stefano V. Albrecht and Kenny Smith},
   title     = {Expressivity of Emergent Languages is a Trade-off between Contextual Complexity and Unpredictability},
   booktitle = {International Conference on Learning Representations (ICLR)},
   year      = {2022}
}

Lukas Schäfer
Task Generalisation in Multi-Agent Reinforcement Learning
International Conference on Autonomous Agents and Multiagent Systems, Doctoral Consortium, 2022
Abstract | BibTex | Paper
AAMAS multi-agent-rl

@inproceedings{schaefer2022task,
   title     = {Task Generalisation in Multi-Agent Reinforcement Learning},
   author    = {Lukas Sch{\"a}fer},
   booktitle = {Doctoral Consortium at the International Conference on Autonomous Agents and Multiagent Systems},
   year      = {2022}
}

Filippos Christianos
Collaborative Training of Multiple Autonomous Agents
International Conference on Autonomous Agents and Multiagent Systems, Doctoral Consortium, 2022
Abstract | BibTex | Paper
AAMAS multi-agent-rl

@inproceedings{christianos2022collaborative,
   author    = {Filippos Christianos},
   title     = {Collaborative Training of Multiple Autonomous Agents},
   booktitle = {Doctoral Consortium at the International Conference on Autonomous Agents and Multiagent Systems},
   year      = {2022}
}

Arrasy Rahman, Elliot Fosong, Ignacio Carlucho, Stefano V. Albrecht
Towards Robust Ad Hoc Teamwork Agents By Creating Diverse Training Teammates
IJCAI Workshop on Ad Hoc Teamwork, 2022
Abstract | BibTex | arXiv | Code
IJCAI ad-hoc-teamwork multi-agent-rl

@inproceedings{rahman2022towards,
   author    = {Arrasy Rahman and Elliot Fosong and Ignacio Carlucho and Stefano V. Albrecht},
   title     = {Towards Robust Ad Hoc Teamwork Agents By Creating Diverse Training Teammates},
   booktitle = {IJCAI Workshop on Ad Hoc Teamwork},
   year      = {2022}
}

Elliot Fosong, Arrasy Rahman, Ignacio Carlucho, Stefano V. Albrecht
Few-Shot Teamwork
IJCAI Workshop on Ad Hoc Teamwork, 2022
Abstract | BibTex | arXiv
IJCAI ad-hoc-teamwork multi-agent-rl

@inproceedings{fosong2022fewshot,
   author    = {Elliot Fosong and Arrasy Rahman and Ignacio Carlucho and Stefano V. Albrecht},
   title     = {Few-Shot Teamwork},
   booktitle = {IJCAI Workshop on Ad Hoc Teamwork},
   year      = {2022}
}

Ignacio Carlucho, Arrasy Rahman, William Ard, Elliot Fosong, Corina Barbalata, Stefano V. Albrecht
Cooperative Marine Operations Via Ad Hoc Teams
IJCAI Workshop on Ad Hoc Teamwork, 2022
Abstract | BibTex | arXiv
IJCAI ad-hoc-teamwork multi-agent-rl

@inproceedings{Carlucho2022UnderwaterAHT,
   title     = {Cooperative Marine Operations Via Ad Hoc Teams},
   author    = {Ignacio Carlucho and Arrasy Rahman and William Ard and Elliot Fosong and Corina Barbalata and Stefano V. Albrecht},
   booktitle = {IJCAI Workshop on Ad Hoc Teamwork},
   year      = {2022}
}

Aleksandar Krnjaic, Jonathan D. Thomas, Georgios Papoudakis, Lukas Schäfer, Peter Börsting, Stefano V. Albrecht
Scalable Multi-Agent Reinforcement Learning for Warehouse Logistics with Robotic and Human Co-Workers
arXiv:2212.11498, 2022
Abstract | BibTex | arXiv
deep-rl multi-agent-rl

@misc{Krnjaic2022HSNAC,
   title         = {Scalable Multi-Agent Reinforcement Learning for Warehouse Logistics with Robotic and Human Co-Workers},
   author        = {Aleksandar Krnjaic and Jonathan D. Thomas and Georgios Papoudakis and Lukas Sch{\"a}fer and Peter B{\"o}rsting and Stefano V. Albrecht},
   year          = {2022},
   eprint        = {2212.11498},
   archivePrefix = {arXiv}
}

Lukas Schäfer, Filippos Christianos, Amos Storkey, Stefano V. Albrecht
Learning Task Embeddings for Teamwork Adaptation in Multi-Agent Reinforcement Learning
arXiv:2207.02249, 2022
Abstract | BibTex | arXiv
deep-rl multi-agent-rl

@misc{schaefer2022mate,
   title         = {Learning Task Embeddings for Teamwork Adaptation in Multi-Agent Reinforcement Learning},
   author        = {Lukas Sch{\"a}fer and Filippos Christianos and Amos Storkey and Stefano V. Albrecht},
   year          = {2022},
   eprint        = {2207.02249},
   archivePrefix = {arXiv},
   primaryClass  = {cs.MA}
}

Filippos Christianos, Georgios Papoudakis, Stefano V. Albrecht
Pareto Actor-Critic for Equilibrium Selection in Multi-Agent Reinforcement Learning
arXiv:2209.14344, 2022
Abstract | BibTex | arXiv
deep-rl multi-agent-rl

@misc{christianos2022pareto,
   author        = {Filippos Christianos and Georgios Papoudakis and Stefano V. Albrecht},
   title         = {Pareto Actor-Critic for Equilibrium Selection in Multi-Agent Reinforcement Learning},
   year          = {2022},
   eprint        = {2209.14344},
   archivePrefix = {arXiv},
   primaryClass  = {cs.LG}
}

2021

Georgios Papoudakis, Filippos Christianos, Lukas Schäfer, Stefano V. Albrecht
Benchmarking Multi-Agent Deep Reinforcement Learning Algorithms in Cooperative Tasks
Conference on Neural Information Processing Systems, Datasets and Benchmarks Track, 2021
Abstract | BibTex | arXiv | Code
NeurIPS deep-rl multi-agent-rl

@inproceedings{papoudakis2021benchmarking,
   title      = {Benchmarking Multi-Agent Deep Reinforcement Learning Algorithms in Cooperative Tasks},
   author     = {Georgios Papoudakis and Filippos Christianos and Lukas Sch{\"a}fer and Stefano V. Albrecht},
   booktitle  = {Proceedings of the Neural Information Processing Systems Track on Datasets and Benchmarks (NeurIPS)},
   year       = {2021},
   url        = {http://arxiv.org/abs/2006.07869},
   openreview = {https://openreview.net/forum?id=cIrPX-Sn5n},
   code       = {https://github.com/uoe-agents/epymarl}
}

Filippos Christianos, Georgios Papoudakis, Arrasy Rahman, Stefano V. Albrecht
Scaling Multi-Agent Reinforcement Learning with Selective Parameter Sharing
International Conference on Machine Learning, 2021
Abstract | BibTex | arXiv | Video | Code
ICML deep-rl multi-agent-rl

@inproceedings{christianos2021scaling,
   author    = {Filippos Christianos and Georgios Papoudakis and Arrasy Rahman and Stefano V. Albrecht},
   title     = {Scaling Multi-Agent Reinforcement Learning with Selective Parameter Sharing},
   booktitle = {International Conference on Machine Learning (ICML)},
   year      = {2021}
}

Shangmin Guo, Yi Ren, Kory Mathewson, Simon Kirby, Stefano V. Albrecht, Kenny Smith
Expressivity of Emergent Language is a Trade-off between Contextual Complexity and Unpredictability
arXiv:2106.03982, 2021
Abstract | BibTex | arXiv
multi-agent-rl emergent-communication

@misc{guo2021expressivity,
   author        = {Shangmin Guo and Yi Ren and Kory Mathewson and Simon Kirby and Stefano V. Albrecht and Kenny Smith},
   title         = {Expressivity of Emergent Language is a Trade-off between Contextual Complexity and Unpredictability},
   year          = {2021},
   eprint        = {2106.03982},
   archivePrefix = {arXiv},
   primaryClass  = {cs.CL}
}

2020

Filippos Christianos, Lukas Schäfer, Stefano V. Albrecht
Shared Experience Actor-Critic for Multi-Agent Reinforcement Learning
Conference on Neural Information Processing Systems, 2020
Abstract | BibTex | arXiv
NeurIPS deep-rl multi-agent-rl

@inproceedings{christianos2020shared,
   title     = {Shared Experience Actor-Critic for Multi-Agent Reinforcement Learning},
   author    = {Filippos Christianos and Lukas Sch{\"a}fer and Stefano V. Albrecht},
   booktitle = {34th Conference on Neural Information Processing Systems},
   year      = {2020}
}

Georgios Papoudakis, Filippos Christianos, Lukas Schäfer, Stefano V. Albrecht
Comparative Evaluation of Multi-Agent Deep Reinforcement Learning Algorithms
arXiv:2006.07869, 2020
Abstract | BibTex | arXiv
deep-rl multi-agent-rl

@misc{papoudakis2020comparative,
   title         = {Comparative Evaluation of Multi-Agent Deep Reinforcement Learning Algorithms},
   author        = {Georgios Papoudakis and Filippos Christianos and Lukas Sch{\"a}fer and Stefano V. Albrecht},
   year          = {2020},
   eprint        = {2006.07869},
   archivePrefix = {arXiv},
   primaryClass  = {cs.LG}
}

2019

Georgios Papoudakis, Filippos Christianos, Arrasy Rahman, Stefano V. Albrecht
Dealing with Non-Stationarity in Multi-Agent Deep Reinforcement Learning
arXiv:1906.04737, 2019
Abstract | BibTex | arXiv
survey deep-rl multi-agent-rl

@misc{papoudakis2019dealing,
   author        = {Georgios Papoudakis and Filippos Christianos and Arrasy Rahman and Stefano V. Albrecht},
   title         = {Dealing with Non-Stationarity in Multi-Agent Deep Reinforcement Learning},
   year          = {2019},
   eprint        = {1906.04737},
   archivePrefix = {arXiv},
   primaryClass  = {cs.LG}
}

2012

Stefano V. Albrecht, Subramanian Ramamoorthy
Comparative Evaluation of Multiagent Learning Algorithms in a Diverse Set of Ad Hoc Team Problems
International Conference on Autonomous Agents and Multiagent Systems, 2012
Abstract | BibTex | arXiv
AAMAS multi-agent-rl ad-hoc-teamwork

@inproceedings{albrecht2012comparative,
   author    = {Stefano V. Albrecht and Subramanian Ramamoorthy},
   title     = {Comparative Evaluation of {MAL} Algorithms in a Diverse Set of Ad Hoc Team Problems},
   booktitle = {Proceedings of the 11th International Conference on Autonomous Agents and Multiagent Systems},
   pages     = {349--356},
   year      = {2012}
}