Publications

For news about publications, follow us on X/Twitter:

Click on any author names or tags to filter publications.

All topic tags:
survey deep-rl multi-agent-rl agent-modelling ad-hoc-teamwork autonomous-driving goal-recognition explainable-ai causal generalisation security emergent-communication iterated-learning intrinsic-reward simulator state-estimation deep-learning transfer-learning

Selected tags (click to remove):
multi-agent-rl Stefano-V.-Albrecht

2024

Stefano V. Albrecht, Filippos Christianos, Lukas Schäfer
Multi-Agent Reinforcement Learning: Foundations and Modern Approaches
MIT Press (print version scheduled for fall 2024), 2024
Abstract | BibTex | Book website | Book codebase
MITP multi-agent-rl deep-rl deep-learning survey

@book{marl-book,
  title     = {Multi-Agent Reinforcement Learning: Foundations and Modern Approaches},
  author    = {Albrecht, Stefano V. and Christianos, Filippos and Sch\"afer, Lukas},
  publisher = {MIT Press},
  year      = {2024},
  url       = {https://www.marl-book.com},
}

Elliot Fosong, Arrasy Rahman, Ignacio Carlucho, Stefano V. Albrecht
Learning Complex Teamwork Tasks Using a Given Sub-task Decomposition
International Conference on Autonomous Agents and Multiagent Systems, 2024
Abstract | BibTex | arXiv | Code
AAMAS multi-agent-rl

@inproceedings{fosongLearningComplexTeamwork2024,
  author    = {Elliot Fosong and Arrasy Rahman and Ignacio Carlucho and Stefano V. Albrecht},
  title     = {Learning Complex Teamwork Tasks Using a Given Sub-task Decomposition},
  booktitle = {Proceedings of the 23rd International Conference on Autonomous Agents and Multiagent Systems},
  year      = {2024},
}

2023

Arrasy Rahman, Ignacio Carlucho, Niklas Höpner, Stefano V. Albrecht
A General Learning Framework for Open Ad Hoc Teamwork Using Graph-based Policy Learning
Journal of Machine Learning Research, 2023
Abstract | BibTex | arXiv | Publisher | Code
JMLR ad-hoc-teamwork deep-rl agent-modelling multi-agent-rl

@article{JRahman2022POGPL,
  title   = {A General Learning Framework for Open Ad Hoc Teamwork Using Graph-based Policy Learning},
  author  = {Rahman, Arrasy and Carlucho, Ignacio and H\"opner, Niklas and Albrecht, Stefano V.},
  journal = {Journal of Machine Learning Research},
  volume  = {24},
  number  = {298},
  pages   = {1--74},
  year    = {2023},
  url     = {http://jmlr.org/papers/v24/22-099.html},
}

Filippos Christianos, Georgios Papoudakis, Stefano V. Albrecht
Pareto Actor-Critic for Equilibrium Selection in Multi-Agent Reinforcement Learning
Transactions on Machine Learning Research, 2023
Abstract | BibTex | arXiv | Code
TMLR deep-rl multi-agent-rl

% TMLR is a journal: the venue is stored in `journal`, so the entry type is @article
% (an @inproceedings entry would require `booktitle` and ignore `journal`).
@article{christianos2023pareto,
   title={Pareto Actor-Critic for Equilibrium Selection in Multi-Agent Reinforcement Learning},
   author={Filippos Christianos and Georgios Papoudakis and Stefano V. Albrecht},
   journal={Transactions on Machine Learning Research (TMLR)},
   year={2023}
}

Arrasy Rahman, Elliot Fosong, Ignacio Carlucho, Stefano V. Albrecht
Generating Teammates for Training Robust Ad Hoc Teamwork Agents via Best-Response Diversity
Transactions on Machine Learning Research, 2023
Abstract | BibTex | arXiv | Code
TMLR ad-hoc-teamwork multi-agent-rl deep-rl

@article{rahman2023BRDiv,
  author  = {Rahman, Arrasy and Fosong, Elliot and Carlucho, Ignacio and Albrecht, Stefano V.},
  title   = {Generating Teammates for Training Robust Ad Hoc Teamwork Agents via Best-Response Diversity},
  journal = {Transactions on Machine Learning Research (TMLR)},
  year    = {2023},
}

Lukas Schäfer, Filippos Christianos, Amos Storkey, Stefano V. Albrecht
Learning Task Embeddings for Teamwork Adaptation in Multi-Agent Reinforcement Learning
NeurIPS Workshop on Generalization in Planning, 2023
Abstract | BibTex | arXiv | Code
NeurIPS multi-agent-rl deep-rl

% The umlaut is written as a LaTeX escape so the entry also works with classic
% (8-bit) BibTeX, which mis-sorts and mis-labels raw UTF-8 characters.
@inproceedings{schaefer2023mate,
   title={Learning Task Embeddings for Teamwork Adaptation in Multi-Agent Reinforcement Learning},
   author={Lukas Sch{\"a}fer and Filippos Christianos and Amos Storkey and Stefano V. Albrecht},
   booktitle={NeurIPS Workshop on Generalization in Planning},
   year={2023}
}

Filippos Christianos, Georgios Papoudakis, Stefano V. Albrecht
Pareto Actor-Critic for Equilibrium Selection in Multi-Agent Reinforcement Learning
AAMAS Workshop on Optimization and Learning in Multiagent Systems, 2023
Abstract | BibTex | arXiv
AAMAS deep-rl multi-agent-rl

% Workshop version of the paper. The key carries a "workshop" suffix because the
% TMLR version of the same paper already uses the key christianos2023pareto, and
% BibTeX rejects repeated keys (only the first entry with a given key is kept).
@inproceedings{christianos2023paretoworkshop,
   title={Pareto Actor-Critic for Equilibrium Selection in Multi-Agent Reinforcement Learning},
   author={Filippos Christianos and Georgios Papoudakis and Stefano V. Albrecht},
   booktitle={AAMAS Workshop on Optimization and Learning in Multiagent Systems},
   year={2023}
}

Elliot Fosong, Arrasy Rahman, Ignacio Carlucho, Stefano V. Albrecht
Learning Complex Teamwork Tasks Using a Sub-task Curriculum
AAMAS Workshop on Multiagent Sequential Decision Making Under Uncertainty, 2023
Abstract | BibTex | arXiv | Code
AAMAS multi-agent-rl ad-hoc-teamwork transfer-learning

% Authors must be separated by " and "; a comma-separated list is parsed by
% BibTeX as a single malformed name. The title is stored in Title Case so that
% styles can downcase it if they wish (lost capitals cannot be restored).
@inproceedings{fosong2023learning,
   title={Learning Complex Teamwork Tasks Using a Sub-task Curriculum},
   author={Elliot Fosong and Arrasy Rahman and Ignacio Carlucho and Stefano V. Albrecht},
   booktitle={AAMAS Workshop on Multiagent Sequential Decision Making under Uncertainty},
   year={2023},
}

Adam Michalski, Filippos Christianos, Stefano V. Albrecht
SMAClite: A Lightweight Environment for Multi-Agent Reinforcement Learning
AAMAS Workshop on Multiagent Sequential Decision Making Under Uncertainty, 2023
Abstract | BibTex | arXiv | Code
AAMAS deep-rl multi-agent-rl

% {SMAClite} is brace-protected so sentence-casing styles do not render it as
% "Smaclite". "Workshop" is capitalised to match the other workshop entries.
@inproceedings{michalski2023smaclite,
   title={{SMAClite}: A Lightweight Environment for Multi-Agent Reinforcement Learning},
   author={Adam Michalski and Filippos Christianos and Stefano V. Albrecht},
   booktitle={AAMAS Workshop on Multiagent Sequential Decision Making Under Uncertainty (MSDM)},
   year={2023}
}

Lukas Schäfer, Oliver Slumbers, Stephen McAleer, Yali Du, Stefano V. Albrecht, David Mguni
Ensemble Value Functions for Efficient Exploration in Multi-Agent Reinforcement Learning
AAMAS Workshop on Adaptive and Learning Agents, 2023
Abstract | BibTex | arXiv
AAMAS multi-agent-rl deep-rl

% The umlaut is written as a LaTeX escape so the entry also works with classic
% (8-bit) BibTeX, which mis-sorts and mis-labels raw UTF-8 characters.
@inproceedings{schaefer2023emax,
   title={Ensemble Value Functions for Efficient Exploration in Multi-Agent Reinforcement Learning},
   author={Lukas Sch{\"a}fer and Oliver Slumbers and Stephen McAleer and Yali Du and Stefano V. Albrecht and David Mguni},
   year={2023},
   booktitle={AAMAS Workshop on Adaptive and Learning Agents (ALA)},
}

Callum Tilbury, Filippos Christianos, Stefano V. Albrecht
Revisiting the Gumbel-Softmax in MADDPG
AAMAS Workshop on Adaptive and Learning Agents, 2023
Abstract | BibTex | arXiv | Code
AAMAS multi-agent-rl deep-rl

% {Gumbel-Softmax} and {MADDPG} are brace-protected so sentence-casing styles
% keep the proper noun and the acronym capitalised.
@inproceedings{tilbury2023revisitingmaddpg,
   title={Revisiting the {Gumbel-Softmax} in {MADDPG}},
   author={Callum Tilbury and Filippos Christianos and Stefano V. Albrecht},
   year={2023},
   booktitle={AAMAS Workshop on Adaptive and Learning Agents (ALA)},
}

Aleksandar Krnjaic, Raul D. Steleac, Jonathan D. Thomas, Georgios Papoudakis, Lukas Schäfer, Andrew Wing Keung To, Kuan-Ho Lao, Murat Cubuktepe, Matthew Haley, Peter Börsting, Stefano V. Albrecht
Scalable Multi-Agent Reinforcement Learning for Warehouse Logistics with Robotic and Human Co-Workers
arXiv:2212.11498, 2023
Abstract | BibTex | arXiv | Website
multi-agent-rl simulator

@misc{krnjaic2023scalable,
  author        = {Krnjaic, Aleksandar and Steleac, Raul D. and Thomas, Jonathan D. and Papoudakis, Georgios and Sch\"afer, Lukas and To, Andrew Wing Keung and Lao, Kuan-Ho and Cubuktepe, Murat and Haley, Matthew and B\"orsting, Peter and Albrecht, Stefano V.},
  title         = {Scalable Multi-Agent Reinforcement Learning for Warehouse Logistics with Robotic and Human Co-Workers},
  eprint        = {2212.11498},
  archivePrefix = {arXiv},
  primaryClass  = {cs.LG},
  year          = {2023},
}

2022

Stefano V. Albrecht, Michael Wooldridge
Special Issue on Multi-Agent Systems Research in the United Kingdom: Guest Editorial
AI Communications, 2022
Abstract | BibTex | Publisher | Special Issue
AIC survey deep-rl multi-agent-rl agent-modelling

@article{albrecht2020special,
  author    = {Albrecht, Stefano V. and Wooldridge, Michael},
  title     = {Special Issue on Multi-Agent Systems Research in the United Kingdom: Guest Editorial},
  journal   = {AI Communications},
  publisher = {IOS Press},
  volume    = {35},
  number    = {4},
  year      = {2022},
  url       = {https://content.iospress.com/articles/ai-communications/aic229003},
}

Ibrahim H. Ahmed, Cillian Brewitt, Ignacio Carlucho, Filippos Christianos, Mhairi Dunion, Elliot Fosong, Samuel Garcin, Shangmin Guo, Balint Gyevnar, Trevor McInroe, Georgios Papoudakis, Arrasy Rahman, Lukas Schäfer, Massimiliano Tamborski, Giuseppe Vecchio, Cheng Wang, Stefano V. Albrecht
Deep Reinforcement Learning for Multi-Agent Interaction
AI Communications, 2022
Abstract | BibTex | arXiv | Publisher
AIC survey deep-rl multi-agent-rl ad-hoc-teamwork agent-modelling goal-recognition security explainable-ai autonomous-driving

% The umlaut in "Schäfer" is written as a LaTeX escape so the entry also works
% with classic (8-bit) BibTeX, which mis-sorts and mis-labels raw UTF-8 characters.
@article{albrecht2022aic,
   author = {Ahmed, Ibrahim H. and Brewitt, Cillian and Carlucho, Ignacio and Christianos, Filippos and Dunion, Mhairi and Fosong, Elliot and Garcin, Samuel and Guo, Shangmin and Gyevnar, Balint and McInroe, Trevor and Papoudakis, Georgios and Rahman, Arrasy and Sch{\"a}fer, Lukas and Tamborski, Massimiliano and Vecchio, Giuseppe and Wang, Cheng and Albrecht, Stefano V.},
   title = {Deep Reinforcement Learning for Multi-Agent Interaction},
   journal = {AI Communications, Special Issue on Multi-Agent Systems Research in the UK},
   year = {2022}
}

Shangmin Guo, Yi Ren, Kory Mathewson, Simon Kirby, Stefano V. Albrecht, Kenny Smith
Expressivity of Emergent Languages is a Trade-off between Contextual Complexity and Unpredictability
International Conference on Learning Representations, 2022
Abstract | BibTex | arXiv | Code
ICLR multi-agent-rl emergent-communication

@inproceedings{guo2022expressivity,
  author    = {Guo, Shangmin and Ren, Yi and Mathewson, Kory and Kirby, Simon and Albrecht, Stefano V. and Smith, Kenny},
  title     = {Expressivity of Emergent Languages is a Trade-off between Contextual Complexity and Unpredictability},
  booktitle = {International Conference on Learning Representations (ICLR)},
  year      = {2022},
}

Arrasy Rahman, Elliot Fosong, Ignacio Carlucho, Stefano V. Albrecht
Towards Robust Ad Hoc Teamwork Agents By Creating Diverse Training Teammates
IJCAI Workshop on Ad Hoc Teamwork, 2022
Abstract | BibTex | arXiv | Code
IJCAI ad-hoc-teamwork multi-agent-rl

@inproceedings{rahman2022towards,
  author    = {Rahman, Arrasy and Fosong, Elliot and Carlucho, Ignacio and Albrecht, Stefano V.},
  title     = {Towards Robust Ad Hoc Teamwork Agents By Creating Diverse Training Teammates},
  booktitle = {IJCAI Workshop on Ad Hoc Teamwork},
  year      = {2022},
}

Elliot Fosong, Arrasy Rahman, Ignacio Carlucho, Stefano V. Albrecht
Few-Shot Teamwork
IJCAI Workshop on Ad Hoc Teamwork, 2022
Abstract | BibTex | arXiv
IJCAI ad-hoc-teamwork multi-agent-rl

@inproceedings{fosong2022fewshot,
  author    = {Fosong, Elliot and Rahman, Arrasy and Carlucho, Ignacio and Albrecht, Stefano V.},
  title     = {Few-Shot Teamwork},
  booktitle = {IJCAI Workshop on Ad Hoc Teamwork},
  year      = {2022},
}

Ignacio Carlucho, Arrasy Rahman, William Ard, Elliot Fosong, Corina Barbalata, Stefano V. Albrecht
Cooperative Marine Operations Via Ad Hoc Teams
IJCAI Workshop on Ad Hoc Teamwork, 2022
Abstract | BibTex | arXiv
IJCAI ad-hoc-teamwork multi-agent-rl

% Authors must be separated by " and "; a comma-separated list is parsed by
% BibTeX as a single malformed name.
@inproceedings{Carlucho2022UnderwaterAHT,
   title={Cooperative Marine Operations Via Ad Hoc Teams},
   author={Ignacio Carlucho and Arrasy Rahman and William Ard and Elliot Fosong and Corina Barbalata and Stefano V. Albrecht},
   booktitle={IJCAI Workshop on Ad Hoc Teamwork},
   year={2022}
}

Aleksandar Krnjaic, Jonathan D. Thomas, Georgios Papoudakis, Lukas Schäfer, Peter Börsting, Stefano V. Albrecht
Scalable Multi-Agent Reinforcement Learning for Warehouse Logistics with Robotic and Human Co-Workers
arXiv:2212.11498, 2022
Abstract | BibTex | arXiv
deep-rl multi-agent-rl

% The author field is closed with "}" before the separating comma; without it
% the braces are unbalanced and the remaining fields are swallowed into `author`.
@misc{Krnjaic2022HSNAC,
   title={Scalable Multi-Agent Reinforcement Learning for Warehouse Logistics with Robotic and Human Co-Workers},
   author={Aleksandar Krnjaic and Jonathan D. Thomas and Georgios Papoudakis and Lukas Sch\"afer and Peter B\"orsting and Stefano V. Albrecht},
   year={2022},
   eprint={2212.11498},
   archivePrefix={arXiv}
}

Lukas Schäfer, Filippos Christianos, Amos Storkey, Stefano V. Albrecht
Learning Task Embeddings for Teamwork Adaptation in Multi-Agent Reinforcement Learning
arXiv:2207.02249, 2022
Abstract | BibTex | arXiv
deep-rl multi-agent-rl

% The umlaut is written as a LaTeX escape so the entry also works with classic
% (8-bit) BibTeX, which mis-sorts and mis-labels raw UTF-8 characters.
@misc{schaefer2022mate,
   title={Learning Task Embeddings for Teamwork Adaptation in Multi-Agent Reinforcement Learning},
   author={Lukas Sch{\"a}fer and Filippos Christianos and Amos Storkey and Stefano V. Albrecht},
   year={2022},
   eprint={2207.02249},
   archivePrefix={arXiv},
   primaryClass={cs.MA}
}

Filippos Christianos, Georgios Papoudakis, Stefano V. Albrecht
Pareto Actor-Critic for Equilibrium Selection in Multi-Agent Reinforcement Learning
arXiv:2209.14344, 2022
Abstract | BibTex | arXiv
deep-rl multi-agent-rl

@misc{christianos2022pareto,
  author        = {Christianos, Filippos and Papoudakis, Georgios and Albrecht, Stefano V.},
  title         = {Pareto Actor-Critic for Equilibrium Selection in Multi-Agent Reinforcement Learning},
  eprint        = {2209.14344},
  archivePrefix = {arXiv},
  primaryClass  = {cs.LG},
  year          = {2022},
}

2021

Georgios Papoudakis, Filippos Christianos, Lukas Schäfer, Stefano V. Albrecht
Benchmarking Multi-Agent Deep Reinforcement Learning Algorithms in Cooperative Tasks
Conference on Neural Information Processing Systems, Datasets and Benchmarks Track, 2021
Abstract | BibTex | arXiv | Code
NeurIPS deep-rl multi-agent-rl

@inproceedings{papoudakis2021benchmarking,
  author     = {Papoudakis, Georgios and Christianos, Filippos and Sch\"afer, Lukas and Albrecht, Stefano V.},
  title      = {Benchmarking Multi-Agent Deep Reinforcement Learning Algorithms in Cooperative Tasks},
  booktitle  = {Proceedings of the Neural Information Processing Systems Track on Datasets and Benchmarks (NeurIPS)},
  year       = {2021},
  url        = {http://arxiv.org/abs/2006.07869},
  openreview = {https://openreview.net/forum?id=cIrPX-Sn5n},
  code       = {https://github.com/uoe-agents/epymarl},
}

Filippos Christianos, Georgios Papoudakis, Arrasy Rahman, Stefano V. Albrecht
Scaling Multi-Agent Reinforcement Learning with Selective Parameter Sharing
International Conference on Machine Learning, 2021
Abstract | BibTex | arXiv | Video | Code
ICML deep-rl multi-agent-rl

@inproceedings{christianos2021scaling,
  author    = {Christianos, Filippos and Papoudakis, Georgios and Rahman, Arrasy and Albrecht, Stefano V.},
  title     = {Scaling Multi-Agent Reinforcement Learning with Selective Parameter Sharing},
  booktitle = {International Conference on Machine Learning (ICML)},
  year      = {2021},
}

Shangmin Guo, Yi Ren, Kory Mathewson, Simon Kirby, Stefano V. Albrecht, Kenny Smith
Expressivity of Emergent Language is a Trade-off between Contextual Complexity and Unpredictability
arXiv:2106.03982, 2021
Abstract | BibTex | arXiv
multi-agent-rl emergent-communication

@misc{guo2021expressivity,
  author        = {Guo, Shangmin and Ren, Yi and Mathewson, Kory and Kirby, Simon and Albrecht, Stefano V. and Smith, Kenny},
  title         = {Expressivity of Emergent Language is a Trade-off between Contextual Complexity and Unpredictability},
  eprint        = {2106.03982},
  archivePrefix = {arXiv},
  primaryClass  = {cs.CL},
  year          = {2021},
}

2020

Filippos Christianos, Lukas Schäfer, Stefano V. Albrecht
Shared Experience Actor-Critic for Multi-Agent Reinforcement Learning
Conference on Neural Information Processing Systems, 2020
Abstract | BibTex | arXiv
NeurIPS deep-rl multi-agent-rl

@inproceedings{christianos2020shared,
  author    = {Christianos, Filippos and Sch\"afer, Lukas and Albrecht, Stefano V.},
  title     = {Shared Experience Actor-Critic for Multi-Agent Reinforcement Learning},
  booktitle = {34th Conference on Neural Information Processing Systems},
  year      = {2020},
}

Georgios Papoudakis, Filippos Christianos, Lukas Schäfer, Stefano V. Albrecht
Comparative Evaluation of Multi-Agent Deep Reinforcement Learning Algorithms
arXiv:2006.07869, 2020
Abstract | BibTex | arXiv
deep-rl multi-agent-rl

@misc{papoudakis2020comparative,
  author        = {Papoudakis, Georgios and Christianos, Filippos and Sch\"afer, Lukas and Albrecht, Stefano V.},
  title         = {Comparative Evaluation of Multi-Agent Deep Reinforcement Learning Algorithms},
  eprint        = {2006.07869},
  archivePrefix = {arXiv},
  primaryClass  = {cs.LG},
  year          = {2020},
}

2019

Georgios Papoudakis, Filippos Christianos, Arrasy Rahman, Stefano V. Albrecht
Dealing with Non-Stationarity in Multi-Agent Deep Reinforcement Learning
arXiv:1906.04737, 2019
Abstract | BibTex | arXiv
survey deep-rl multi-agent-rl

@misc{papoudakis2019dealing,
  author        = {Papoudakis, Georgios and Christianos, Filippos and Rahman, Arrasy and Albrecht, Stefano V.},
  title         = {Dealing with Non-Stationarity in Multi-Agent Deep Reinforcement Learning},
  eprint        = {1906.04737},
  archivePrefix = {arXiv},
  primaryClass  = {cs.LG},
  year          = {2019},
}

2012

Stefano V. Albrecht, Subramanian Ramamoorthy
Comparative Evaluation of Multiagent Learning Algorithms in a Diverse Set of Ad Hoc Team Problems
International Conference on Autonomous Agents and Multiagent Systems, 2012
Abstract | BibTex | arXiv
AAMAS multi-agent-rl ad-hoc-teamwork

@inproceedings{albrecht2012comparative,
  author    = {Albrecht, Stefano V. and Ramamoorthy, Subramanian},
  title     = {Comparative Evaluation of {MAL} Algorithms in a Diverse Set of Ad Hoc Team Problems},
  booktitle = {Proceedings of the 11th International Conference on Autonomous Agents and Multiagent Systems},
  year      = {2012},
  pages     = {349--356},
}