Publications

For news about publications, follow us on X:

Click on any author name or tag to filter publications.

All topic tags:
survey deep-rl multi-agent-rl agent-modelling ad-hoc-teamwork autonomous-driving goal-recognition explainable-ai causal generalisation security emergent-communication iterated-learning intrinsic-reward simulator state-estimation deep-learning transfer-learning

Selected tags (click to remove):
ICLR

2025

Samuel Garcin, Trevor McInroe, Pablo Samuel Castro, Christopher G. Lucas, David Abel, Prakash Panangaden, Stefano V. Albrecht
Studying the Interplay Between the Actor and Critic Representations in Reinforcement Learning
International Conference on Learning Representations, 2025
Abstract | BibTex | Paper | Code
ICLR deep-rl generalisation

@inproceedings{garcin2025acrep,
  author    = {Garcin, Samuel and McInroe, Trevor and Castro, Pablo Samuel and Lucas, Christopher G. and Abel, David and Panangaden, Prakash and Albrecht, Stefano V.},
  title     = {Studying the Interplay Between the Actor and Critic Representations in Reinforcement Learning},
  booktitle = {13th International Conference on Learning Representations},
  year      = {2025}
}

Xu Liu, Haobo Fu, Stefano V. Albrecht, Qiang Fu, Shuai Li
Online-to-Offline RL for Agent Alignment
International Conference on Learning Representations, 2025
Abstract | BibTex | Paper | Code
ICLR deep-learning

@comment{The acronym RL in the title is braced so that sentence-casing bibliography styles keep it in upper case.}
@inproceedings{liu2025aligngap,
  author    = {Liu, Xu and Fu, Haobo and Albrecht, Stefano V. and Fu, Qiang and Li, Shuai},
  title     = {Online-to-Offline {RL} for Agent Alignment},
  booktitle = {13th International Conference on Learning Representations},
  year      = {2025}
}

2024

Shangmin Guo, Yi Ren, Stefano V. Albrecht, Kenny Smith
lpNTK: Better Generalisation with Less Data via Sample Interaction During Learning
International Conference on Learning Representations, 2024
Abstract | BibTex | arXiv | Code
ICLR deep-learning

@comment{Title matches the ICLR 2024 listing for this paper; the mixed-case name lpNTK is braced so bibliography styles do not recase it.}
@inproceedings{guo2024lpntk,
  author    = {Guo, Shangmin and Ren, Yi and Albrecht, Stefano V. and Smith, Kenny},
  title     = {{lpNTK}: Better Generalisation with Less Data via Sample Interaction During Learning},
  booktitle = {12th International Conference on Learning Representations},
  year      = {2024},
  url       = {https://openreview.net/forum?id=8Ju0VmvMCW}
}

2023

Mhairi Dunion, Trevor McInroe, Kevin Sebastian Luck, Josiah Hanna, Stefano V. Albrecht
Temporal Disentanglement of Representations for Improved Generalisation in Reinforcement Learning
International Conference on Learning Representations, 2023
Abstract | BibTex | arXiv | Code
ICLR deep-rl generalisation causal

@inproceedings{dunion2023ted,
  author    = {Dunion, Mhairi and McInroe, Trevor and Luck, Kevin Sebastian and Hanna, Josiah and Albrecht, Stefano V.},
  title     = {Temporal Disentanglement of Representations for Improved Generalisation in Reinforcement Learning},
  booktitle = {International Conference on Learning Representations (ICLR)},
  year      = {2023}
}

Yi Ren, Shangmin Guo, Wonho Bae, Danica J. Sutherland
How to Prepare Your Task Head for Finetuning
International Conference on Learning Representations, 2023
Abstract | BibTex | arXiv
ICLR deep-learning transfer-learning

@comment{The url field points to the OpenReview forum page for this paper.}
@inproceedings{ren2023how,
  author    = {Ren, Yi and Guo, Shangmin and Bae, Wonho and Sutherland, Danica J.},
  title     = {How to Prepare Your Task Head for Finetuning},
  booktitle = {International Conference on Learning Representations (ICLR)},
  year      = {2023},
  url       = {https://openreview.net/forum?id=gVOXZproe-e}
}

2022

Shangmin Guo, Yi Ren, Kory Mathewson, Simon Kirby, Stefano V. Albrecht, Kenny Smith
Expressivity of Emergent Languages is a Trade-off between Contextual Complexity and Unpredictability
International Conference on Learning Representations, 2022
Abstract | BibTex | arXiv | Code
ICLR multi-agent-rl emergent-communication

@inproceedings{guo2022expressivity,
  author    = {Guo, Shangmin and Ren, Yi and Mathewson, Kory and Kirby, Simon and Albrecht, Stefano V. and Smith, Kenny},
  title     = {Expressivity of Emergent Languages is a Trade-off between Contextual Complexity and Unpredictability},
  booktitle = {International Conference on Learning Representations (ICLR)},
  year      = {2022}
}