Publications

For news about publications, follow us on X/Twitter:

Click on any author name or tag to filter publications.

All topic tags:
survey deep-rl multi-agent-rl agent-modelling ad-hoc-teamwork autonomous-driving goal-recognition explainable-ai causal generalisation security emergent-communication iterated-learning intrinsic-reward simulator state-estimation deep-learning transfer-learning

Selected tags (click to remove):
Shangmin-Guo

2024

Samuel Garcin, James Doran, Shangmin Guo, Christopher G. Lucas, Stefano V. Albrecht
DRED: Zero-Shot Transfer in Reinforcement Learning via Data-Regularised Environment Design
International Conference on Machine Learning, 2024
Abstract | BibTex | arXiv
ICML deep-rl

@inproceedings{garcin2024dred,
   author    = {Samuel Garcin and James Doran and Shangmin Guo and Christopher G. Lucas and Stefano V. Albrecht},
   title     = {{DRED}: Zero-Shot Transfer in Reinforcement Learning via Data-Regularised Environment Design},
   booktitle = {International Conference on Machine Learning (ICML)},
   year      = {2024},
}

Shangmin Guo, Yi Ren, Stefano V. Albrecht, Kenny Smith
lpNTK: Better Generalisation with Less Data via Sample Interaction During Learning
International Conference on Learning Representations, 2024
Abstract | BibTex | arXiv | Code
ICLR deep-learning

@inproceedings{guo2024lpntk,
   author    = {Shangmin Guo and Yi Ren and Stefano V. Albrecht and Kenny Smith},
   title     = {{lpNTK}: Better Generalisation with Less Data via Sample Interaction During Learning},
   booktitle = {International Conference on Learning Representations (ICLR)},
   year      = {2024},
   url       = {https://openreview.net/forum?id=8Ju0VmvMCW}
}

2023

Samuel Garcin, James Doran, Shangmin Guo, Christopher G. Lucas, Stefano V. Albrecht
How the level sampling process impacts zero-shot generalisation in deep reinforcement learning
NeurIPS Workshop on Agent Learning in Open-Endedness, 2023
Abstract | BibTex | arXiv
NeurIPS deep-rl

@inproceedings{garcin2023level,
   author    = {Samuel Garcin and James Doran and Shangmin Guo and Christopher G. Lucas and Stefano V. Albrecht},
   title     = {How the level sampling process impacts zero-shot generalisation in deep reinforcement learning},
   booktitle = {NeurIPS Workshop on Agent Learning in Open-Endedness},
   year      = {2023},
}

Yi Ren, Shangmin Guo, Wonho Bae, Danica J. Sutherland
How to Prepare Your Task Head for Finetuning
International Conference on Learning Representations, 2023
Abstract | BibTex | arXiv
ICLR deep-learning transfer-learning

@inproceedings{ren2023how,
   author    = {Yi Ren and Shangmin Guo and Wonho Bae and Danica J. Sutherland},
   title     = {How to Prepare Your Task Head for Finetuning},
   booktitle = {International Conference on Learning Representations (ICLR)},
   year      = {2023},
   url       = {https://openreview.net/forum?id=gVOXZproe-e}
}

Samuel Garcin, James Doran, Shangmin Guo, Christopher G. Lucas, Stefano V. Albrecht
How the level sampling process impacts zero-shot generalisation in deep reinforcement learning
arXiv:2310.03494, 2023
Abstract | BibTex | arXiv
deep-rl

@misc{garcin2023levelarxiv,
   author        = {Samuel Garcin and James Doran and Shangmin Guo and Christopher G. Lucas and Stefano V. Albrecht},
   title         = {How the level sampling process impacts zero-shot generalisation in deep reinforcement learning},
   year          = {2023},
   eprint        = {2310.03494},
   archivePrefix = {arXiv},
   primaryClass  = {cs.LG}
}

2022

Ibrahim H. Ahmed, Cillian Brewitt, Ignacio Carlucho, Filippos Christianos, Mhairi Dunion, Elliot Fosong, Samuel Garcin, Shangmin Guo, Balint Gyevnar, Trevor McInroe, Georgios Papoudakis, Arrasy Rahman, Lukas Schäfer, Massimiliano Tamborski, Giuseppe Vecchio, Cheng Wang, Stefano V. Albrecht
Deep Reinforcement Learning for Multi-Agent Interaction
AI Communications, 2022
Abstract | BibTex | arXiv | Publisher
AIC survey deep-rl multi-agent-rl ad-hoc-teamwork agent-modelling goal-recognition security explainable-ai autonomous-driving

@article{albrecht2022aic,
   author  = {Ahmed, Ibrahim H. and Brewitt, Cillian and Carlucho, Ignacio and Christianos, Filippos and Dunion, Mhairi and Fosong, Elliot and Garcin, Samuel and Guo, Shangmin and Gyevnar, Balint and McInroe, Trevor and Papoudakis, Georgios and Rahman, Arrasy and Sch{\"a}fer, Lukas and Tamborski, Massimiliano and Vecchio, Giuseppe and Wang, Cheng and Albrecht, Stefano V.},
   title   = {Deep Reinforcement Learning for Multi-Agent Interaction},
   journal = {AI Communications},
   year    = {2022},
   note    = {Special Issue on Multi-Agent Systems Research in the UK}
}

Shangmin Guo, Yi Ren, Stefano V. Albrecht, Kenny Smith
Sample Relationships through the Lens of Learning Dynamics with Label Information
NeurIPS Workshop on Interpolation and Beyond, 2022
Abstract | BibTex | arXiv
NeurIPS iterated-learning deep-learning transfer-learning

@inproceedings{guo2022relationship,
   author    = {Shangmin Guo and Yi Ren and Stefano V. Albrecht and Kenny Smith},
   title     = {Sample Relationships through the Lens of Learning Dynamics with Label Information},
   booktitle = {NeurIPS 2022 Workshop on Interpolation and Beyond},
   year      = {2022},
}

Shangmin Guo, Yi Ren, Kory Mathewson, Simon Kirby, Stefano V. Albrecht, Kenny Smith
Expressivity of Emergent Languages is a Trade-off between Contextual Complexity and Unpredictability
International Conference on Learning Representations, 2022
Abstract | BibTex | arXiv | Code
ICLR multi-agent-rl emergent-communication

@inproceedings{guo2022expressivity,
   author    = {Shangmin Guo and Yi Ren and Kory Mathewson and Simon Kirby and Stefano V. Albrecht and Kenny Smith},
   title     = {Expressivity of Emergent Languages is a Trade-off between Contextual Complexity and Unpredictability},
   booktitle = {International Conference on Learning Representations (ICLR)},
   year      = {2022},
}

2021

Shangmin Guo, Yi Ren, Kory Mathewson, Simon Kirby, Stefano V. Albrecht, Kenny Smith
Expressivity of Emergent Language is a Trade-off between Contextual Complexity and Unpredictability
arXiv:2106.03982, 2021
Abstract | BibTex | arXiv
multi-agent-rl emergent-communication

@misc{guo2021expressivity,
   author        = {Shangmin Guo and Yi Ren and Kory Mathewson and Simon Kirby and Stefano V. Albrecht and Kenny Smith},
   title         = {Expressivity of Emergent Language is a Trade-off between Contextual Complexity and Unpredictability},
   year          = {2021},
   eprint        = {2106.03982},
   archivePrefix = {arXiv},
   primaryClass  = {cs.CL},
}