Publications

For news about publications, follow us on X.

Click on any author names or tags to filter publications.

All topic tags:
survey deep-rl multi-agent-rl agent-modelling ad-hoc-teamwork autonomous-driving goal-recognition explainable-ai causal generalisation security emergent-communication iterated-learning intrinsic-reward simulator state-estimation deep-learning transfer-learning

Selected tags (click to remove):
agent-modelling

2025

Cheng Wang, Lingxin Kong, Massimiliano Tamborski, Stefano V. Albrecht
HAD-Gen: Human-like and Diverse Driving Behavior Modeling for Controllable Scenario Generation
arXiv:2503.15049, 2025
Abstract | BibTex | arXiv
autonomous-driving agent-modelling

@misc{tessera2025hyper,
   title={{HAD-Gen}: Human-like and Diverse Driving Behavior Modeling for Controllable Scenario Generation},
   author={Cheng Wang and Lingxin Kong and Massimiliano Tamborski and Stefano V. Albrecht},
   year={2025},
   eprint={2503.15049},
   archivePrefix={arXiv}
}

2023

Arrasy Rahman, Ignacio Carlucho, Niklas Höpner, Stefano V. Albrecht
A General Learning Framework for Open Ad Hoc Teamwork Using Graph-based Policy Learning
Journal of Machine Learning Research, 2023
Abstract | BibTex | arXiv | Publisher | Code
JMLR ad-hoc-teamwork deep-rl agent-modelling multi-agent-rl

@article{JRahman2022POGPL,
   author  = {Arrasy Rahman and Ignacio Carlucho and Niklas H{\"o}pner and Stefano V. Albrecht},
   title   = {A General Learning Framework for Open Ad Hoc Teamwork Using Graph-based Policy Learning},
   journal = {Journal of Machine Learning Research},
   year    = {2023},
   volume  = {24},
   number  = {298},
   pages   = {1--74},
   url     = {http://jmlr.org/papers/v24/22-099.html}
}

2022

Stefano V. Albrecht, Michael Wooldridge
Special Issue on Multi-Agent Systems Research in the United Kingdom: Guest Editorial
AI Communications, 2022
Abstract | BibTex | Publisher | Special Issue
AIC survey deep-rl multi-agent-rl agent-modelling

@article{albrecht2022special,
   title = {Special Issue on Multi-Agent Systems Research in the United Kingdom: Guest Editorial},
   author = {Stefano V. Albrecht and Michael Wooldridge},
   journal = {AI Communications},
   volume = {35},
   number = {4},
   year = {2022},
   publisher = {IOS Press},
   url = {https://content.iospress.com/articles/ai-communications/aic229003}
}

Ibrahim H. Ahmed, Cillian Brewitt, Ignacio Carlucho, Filippos Christianos, Mhairi Dunion, Elliot Fosong, Samuel Garcin, Shangmin Guo, Balint Gyevnar, Trevor McInroe, Georgios Papoudakis, Arrasy Rahman, Lukas Schäfer, Massimiliano Tamborski, Giuseppe Vecchio, Cheng Wang, Stefano V. Albrecht
Deep Reinforcement Learning for Multi-Agent Interaction
AI Communications, 2022
Abstract | BibTex | arXiv | Publisher
AIC survey deep-rl multi-agent-rl ad-hoc-teamwork agent-modelling goal-recognition security explainable-ai autonomous-driving

@article{albrecht2022aic,
   author = {Ahmed, Ibrahim H. and Brewitt, Cillian and Carlucho, Ignacio and Christianos, Filippos and Dunion, Mhairi and Fosong, Elliot and Garcin, Samuel and Guo, Shangmin and Gyevnar, Balint and McInroe, Trevor and Papoudakis, Georgios and Rahman, Arrasy and Sch{\"a}fer, Lukas and Tamborski, Massimiliano and Vecchio, Giuseppe and Wang, Cheng and Albrecht, Stefano V.},
   title = {Deep Reinforcement Learning for Multi-Agent Interaction},
   journal = {AI Communications},
   volume = {35},
   number = {4},
   year = {2022},
   note = {Special Issue on Multi-Agent Systems Research in the UK}
}

Arrasy Rahman, Ignacio Carlucho, Niklas Höpner, Stefano V. Albrecht
A General Learning Framework for Open Ad Hoc Teamwork Using Graph-based Policy Learning
arXiv:2210.05448, 2022
Abstract | BibTex | arXiv
ad-hoc-teamwork deep-rl agent-modelling

@misc{Rahman2022POGPL,
   title={A General Learning Framework for Open Ad Hoc Teamwork Using Graph-based Policy Learning},
   author={Arrasy Rahman and Ignacio Carlucho and Niklas H{\"o}pner and Stefano V. Albrecht},
   year={2022},
   eprint={2210.05448},
   archivePrefix={arXiv}
}

2021

Georgios Papoudakis, Filippos Christianos, Stefano V. Albrecht
Agent Modelling under Partial Observability for Deep Reinforcement Learning
Conference on Neural Information Processing Systems, 2021
Abstract | BibTex | arXiv | Code
NeurIPS deep-rl agent-modelling

@inproceedings{papoudakis2021local,
   title={Agent Modelling under Partial Observability for Deep Reinforcement Learning},
   author={Georgios Papoudakis and Filippos Christianos and Stefano V. Albrecht},
   booktitle = {Proceedings of the Conference on Neural Information Processing Systems ({NeurIPS})},
   year = {2021}
}

Arrasy Rahman, Niklas Höpner, Filippos Christianos, Stefano V. Albrecht
Towards Open Ad Hoc Teamwork Using Graph-based Policy Learning
International Conference on Machine Learning, 2021
Abstract | BibTex | arXiv | Video | Code
ICML deep-rl agent-modelling ad-hoc-teamwork

@inproceedings{rahman2021open,
   title={Towards Open Ad Hoc Teamwork Using Graph-based Policy Learning},
   author={Arrasy Rahman and Niklas H{\"o}pner and Filippos Christianos and Stefano V. Albrecht},
   booktitle={International Conference on Machine Learning (ICML)},
   year={2021}
}

Ibrahim H. Ahmed, Josiah P. Hanna, Elliot Fosong, Stefano V. Albrecht
Towards Quantum-Secure Authentication and Key Agreement via Abstract Multi-Agent Interaction
International Conference on Practical Applications of Agents and Multi-Agent Systems, 2021
Abstract | BibTex | arXiv | Publisher | Code
PAAMS security agent-modelling

@inproceedings{ahmed2021quantum,
   author    = {Ibrahim H. Ahmed and Josiah P. Hanna and Elliot Fosong and Stefano V. Albrecht},
   title     = {Towards Quantum-Secure Authentication and Key Agreement via Abstract Multi-Agent Interaction},
   booktitle = {International Conference on Practical Applications of Agents and Multi-Agent Systems (PAAMS)},
   year      = {2021},
}

2020

Stefano V. Albrecht, Peter Stone, Michael P. Wellman
Special Issue on Autonomous Agents Modelling Other Agents: Guest Editorial
Artificial Intelligence, 2020
Abstract | BibTex | Publisher | Special Issue
AIJ survey agent-modelling

@article{albrecht2020special,
   author    = {Stefano V. Albrecht and Peter Stone and Michael P. Wellman},
   title     = {Special Issue on Autonomous Agents Modelling Other Agents: Guest Editorial},
   journal   = {Artificial Intelligence},
   publisher = {Elsevier},
   volume    = {285},
   year      = {2020},
   url       = {https://doi.org/10.1016/j.artint.2020.103292},
}

Georgios Papoudakis, Stefano V. Albrecht
Variational Autoencoders for Opponent Modeling in Multi-Agent Systems
AAAI Workshop on Reinforcement Learning in Games, 2020
Abstract | BibTex | arXiv
AAAI deep-rl agent-modelling

@inproceedings{papoudakis2020variational,
   author    = {Georgios Papoudakis and Stefano V. Albrecht},
   title     = {Variational Autoencoders for Opponent Modeling in Multi-Agent Systems},
   booktitle = {AAAI Workshop on Reinforcement Learning in Games},
   year      = {2020},
}

Arrasy Rahman, Niklas Höpner, Filippos Christianos, Stefano V. Albrecht
Open Ad Hoc Teamwork using Graph-based Policy Learning
arXiv:2006.10412, 2020
Abstract | BibTex | arXiv
deep-rl agent-modelling ad-hoc-teamwork

@misc{rahman2020open,
   title={Open Ad Hoc Teamwork using Graph-based Policy Learning},
   author={Arrasy Rahman and Niklas H{\"o}pner and Filippos Christianos and Stefano V. Albrecht},
   year={2020},
   eprint={2006.10412},
   archivePrefix={arXiv},
   primaryClass={cs.LG}
}

Georgios Papoudakis, Filippos Christianos, Stefano V. Albrecht
Local Information Opponent Modelling Using Variational Autoencoders
arXiv:2006.09447, 2020
Abstract | BibTex | arXiv
deep-rl agent-modelling

@misc{papoudakis2020opponent,
   author        = {Georgios Papoudakis and Filippos Christianos and Stefano V. Albrecht},
   title         = {Local Information Opponent Modelling Using Variational Autoencoders},
   year          = {2020},
   archivePrefix = {arXiv},
   eprint        = {2006.09447},
   primaryClass  = {cs.LG},
}

Ibrahim H. Ahmed, Josiah P. Hanna, Stefano V. Albrecht
Quantum-Secure Authentication via Abstract Multi-Agent Interaction
arXiv:2007.09327, 2020
Abstract | BibTex | arXiv
security agent-modelling

@misc{ahmed2020quantumsecure,
   author        = {Ibrahim H. Ahmed and Josiah P. Hanna and Stefano V. Albrecht},
   title         = {Quantum-Secure Authentication via Abstract Multi-Agent Interaction},
   year          = {2020},
   archivePrefix = {arXiv},
   eprint        = {2007.09327},
   primaryClass  = {cs.CR},
}

2018

Stefano V. Albrecht, Peter Stone
Autonomous Agents Modelling Other Agents: A Comprehensive Survey and Open Problems
Artificial Intelligence, 2018
Abstract | BibTex | arXiv | Publisher
AIJ survey agent-modelling goal-recognition

@article{albrecht2018modelling,
   title = {Autonomous Agents Modelling Other Agents: A Comprehensive Survey and Open Problems},
   author = {Stefano V. Albrecht and Peter Stone},
   journal = {Artificial Intelligence},
   volume = {258},
   pages = {66--95},
   year = {2018},
   publisher = {Elsevier},
   doi = {10.1016/j.artint.2018.01.002}
}

2017

Stefano V. Albrecht, Peter Stone
Reasoning about Hypothetical Agent Behaviours and their Parameters
International Conference on Autonomous Agents and Multiagent Systems, 2017
Abstract | BibTex | arXiv
AAMAS ad-hoc-teamwork agent-modelling

@inproceedings{albrecht2017reasoning,
   author    = {Stefano V. Albrecht and Peter Stone},
   title     = {Reasoning about Hypothetical Agent Behaviours and their Parameters},
   booktitle = {Proceedings of the 16th International Conference on Autonomous Agents and Multiagent Systems},
   year      = {2017},
   pages     = {547--555},
}

2016

Stefano V. Albrecht, Jacob W. Crandall, Subramanian Ramamoorthy
Belief and Truth in Hypothesised Behaviours
Artificial Intelligence, 2016
Abstract | BibTex | arXiv | Publisher
AIJ agent-modelling ad-hoc-teamwork

@article{albrecht2016belief,
   title = {Belief and Truth in Hypothesised Behaviours},
   author = {Stefano V. Albrecht and Jacob W. Crandall and Subramanian Ramamoorthy},
   journal = {Artificial Intelligence},
   volume = {235},
   pages = {63--94},
   year = {2016},
   publisher = {Elsevier},
   doi = {10.1016/j.artint.2016.02.004}
}

2015

Stefano V. Albrecht, Subramanian Ramamoorthy
Are You Doing What I Think You Are Doing? Criticising Uncertain Agent Models
Conference on Uncertainty in Artificial Intelligence, 2015
Abstract | BibTex | arXiv
UAI agent-modelling

@inproceedings{albrecht2015criticising,
   author    = {Stefano V. Albrecht and Subramanian Ramamoorthy},
   title     = {Are You Doing What {I} Think You Are Doing? Criticising Uncertain Agent Models},
   booktitle = {Proceedings of the 31st Conference on Uncertainty in Artificial Intelligence},
   year      = {2015},
   pages     = {52--61},
}

Stefano V. Albrecht, Jacob W. Crandall, Subramanian Ramamoorthy
An Empirical Study on the Practical Impact of Prior Beliefs over Policy Types
AAAI Conference on Artificial Intelligence, 2015
Abstract | BibTex | arXiv | Appendix
AAAI agent-modelling ad-hoc-teamwork

@inproceedings{albrecht2015empirical,
   author    = {Stefano V. Albrecht and Jacob W. Crandall and Subramanian Ramamoorthy},
   title     = {An Empirical Study on the Practical Impact of Prior Beliefs over Policy Types},
   booktitle = {Proceedings of the 29th AAAI Conference on Artificial Intelligence},
   year      = {2015},
   pages     = {1988--1994},
}

Stefano V. Albrecht, Jacob W. Crandall, Subramanian Ramamoorthy
E-HBA: Using Action Policies for Expert Advice and Agent Typification
AAAI Workshop on Multiagent Interaction without Prior Coordination, 2015
Abstract | BibTex | arXiv | Appendix
AAAI agent-modelling ad-hoc-teamwork

@inproceedings{albrecht2015ehba,
   title = {{E-HBA}: Using Action Policies for Expert Advice and Agent Typification},
   author = {Stefano V. Albrecht and Jacob W. Crandall and Subramanian Ramamoorthy},
   booktitle = {AAAI Workshop on Multiagent Interaction without Prior Coordination},
   address = {Austin, Texas, USA},
   month = jan,
   year = {2015}
}

2014

Stefano V. Albrecht, Subramanian Ramamoorthy
On Convergence and Optimality of Best-Response Learning with Policy Types in Multiagent Systems
Conference on Uncertainty in Artificial Intelligence, 2014
Abstract | BibTex | arXiv | Appendix
UAI agent-modelling

@inproceedings{albrecht2014convergence,
   author    = {Stefano V. Albrecht and Subramanian Ramamoorthy},
   title     = {On Convergence and Optimality of Best-Response Learning with Policy Types in Multiagent Systems},
   booktitle = {Proceedings of the 30th Conference on Uncertainty in Artificial Intelligence},
   year      = {2014},
   pages     = {12--21},
}

2013

Stefano V. Albrecht, Subramanian Ramamoorthy
A Game-Theoretic Model and Best-Response Learning Method for Ad Hoc Coordination in Multiagent Systems
International Conference on Autonomous Agents and Multiagent Systems, 2013
Abstract | BibTex | arXiv (full technical report) | Extended Abstract
AAMAS ad-hoc-teamwork agent-modelling

@inproceedings{albrecht2013game,
   title = {A Game-Theoretic Model and Best-Response Learning Method for Ad Hoc Coordination in Multiagent Systems},
   author = {Stefano V. Albrecht and Subramanian Ramamoorthy},
   booktitle = {Proceedings of the 12th International Conference on Autonomous Agents and Multiagent Systems},
   address = {St. Paul, Minnesota, USA},
   month = may,
   year = {2013}
}