I gave a talk at the JADE (UK Supercomputing Facility) 2023 event. We discussed why egocentric vision is important, and the computational requirements of egocentric datasets and video understanding models.
I gave a talk at Samsung AI Centre Cambridge. We looked at the difficulties of scaling few-shot models to handle long-tail tasks.
Feb 10, 2023
I gave a talk at the University of Exeter Computer Science Seminar Series. This included a brief history of image and video datasets, how their properties can cause models to take shortcuts, and some recent solutions.
% HD-EPIC dataset paper. The acronym in the title is wrapped in braces so that
% bibliography styles which sentence-case titles keep its capitals.
@inproceedings{perrett2025hdepic,
  author    = {Perrett, Toby and Darkhalil, Ahmad and Sinha, Saptarshi and Emara, Omar and Pollard, Sam and Parida, Kranti and Liu, Kaiting and Gatti, Prajwal and Bansal, Siddhant and Flanagan, Kevin and Chalk, Jacob and Zhu, Zhifan and Guerrier, Rhodri and Abdelazim, Fahd and Zhu, Bin and Moltisanti, Davide and Wray, Michael and Doughty, Hazel and Damen, Dima},
  title     = {{HD-EPIC}: A Highly-Detailed Egocentric Video Dataset},
  booktitle = {CVPR},
  year      = {2025},
}
Spatial Cognition from Egocentric Video: Out of Sight, Not Out of Mind
Chiara Plizzari, Shubham Goel, Toby Perrett, Jacob Chalk, Angjoo Kanazawa, and Dima Damen
% "Out of Sight, Not Out of Mind" conference paper; all field values are as given.
% NOTE(review): the citation key contains 2023 while the year field is 2025.
% The key is left as-is so existing citations keep resolving; confirm the year.
@inproceedings{Plizzari2023osnom,
  author    = {Plizzari, Chiara and Goel, Shubham and Perrett, Toby and Chalk, Jacob and Kanazawa, Angjoo and Damen, Dima},
  title     = {Spatial Cognition from Egocentric Video: Out of Sight, Not Out of Mind},
  booktitle = {3DV},
  year      = {2025},
}
2024
It’s Just Another Day: Unique Captioning by Discriminative Prompting
Toby Perrett, Tengda Han, Dima Damen, and Andrew Zisserman
% Unique-captioning paper. The award annotation lives in the note field rather
% than inside booktitle, so the venue name stays clean for any bibliography style.
@inproceedings{Perrett2024unique,
  author    = {Perrett, Toby and Han, Tengda and Damen, Dima and Zisserman, Andrew},
  title     = {It's Just Another Day: Unique Captioning by Discriminative Prompting},
  booktitle = {ACCV},
  year      = {2024},
  note      = {Best Paper Award},
}
2023
Use Your Head: Improving Long-Tail Video Recognition
% Long-tail video recognition paper; all field values are as given.
@inproceedings{Perrett2023,
  author    = {Perrett, Toby and Sinha, Saptarshi and Burghardt, Tilo and Mirmehdi, Majid and Damen, Dima},
  title     = {Use Your Head: Improving Long-Tail Video Recognition},
  booktitle = {CVPR},
  year      = {2023},
}
2022
Rescaling Egocentric Vision: Collection, Pipeline and Challenges for EPIC-KITCHENS-100
Dima Damen, Hazel Doughty, Giovanni Maria Farinella, Antonino Furnari, Evangelos Kazakos, Jian Ma, Davide Moltisanti, Jonathan Munro, Toby Perrett, Will Price, and Michael Wray
% EPIC-KITCHENS-100 journal article. Only the dataset name is brace-protected;
% the rest of the title is left for the bibliography style to case.
@article{Damen2022,
  author  = {Damen, Dima and Doughty, Hazel and Farinella, Giovanni Maria and Furnari, Antonino and Kazakos, Evangelos and Ma, Jian and Moltisanti, Davide and Munro, Jonathan and Perrett, Toby and Price, Will and Wray, Michael},
  title   = {Rescaling Egocentric Vision: Collection, Pipeline and Challenges for {EPIC-KITCHENS-100}},
  journal = {IJCV},
  year    = {2022},
}
2021
Temporal-Relational CrossTransformers for Few-Shot Action Recognition
% Few-shot action recognition paper. The camelCase model name is braced so that
% sentence-casing bibliography styles do not flatten it to lowercase.
@inproceedings{Perrett2021,
  author    = {Perrett, Toby and Masullo, Alessandro and Burghardt, Tilo and Mirmehdi, Majid and Damen, Dima},
  title     = {Temporal-Relational {CrossTransformers} for Few-Shot Action Recognition},
  booktitle = {CVPR},
  year      = {2021},
}
2019
DDLSTM: Dual-Domain LSTM for Cross-Domain Action Recognition
% Cross-domain action recognition paper. Both acronyms in the title are braced
% so that sentence-casing bibliography styles keep them in capitals.
@inproceedings{Perrett2019,
  author    = {Perrett, Toby and Damen, Dima},
  title     = {{DDLSTM}: Dual-Domain {LSTM} for Cross-Domain Action Recognition},
  booktitle = {CVPR},
  year      = {2019},
}
2018
Scaling Egocentric Vision: The EPIC-KITCHENS Dataset
Dima Damen, Hazel Doughty, Giovanni Maria Farinella, Sanja Fidler, Antonino Furnari, Evangelos Kazakos, Davide Moltisanti, Jonathan Munro, Toby Perrett, Will Price, and Michael Wray
% Original EPIC-KITCHENS dataset paper. Only the dataset name is brace-protected;
% the rest of the title is left for the bibliography style to case.
@inproceedings{Damen2018EPICKITCHENS,
  author    = {Damen, Dima and Doughty, Hazel and Farinella, Giovanni Maria and Fidler, Sanja and Furnari, Antonino and Kazakos, Evangelos and Moltisanti, Davide and Munro, Jonathan and Perrett, Toby and Price, Will and Wray, Michael},
  title     = {Scaling Egocentric Vision: The {EPIC-KITCHENS} Dataset},
  booktitle = {ECCV},
  year      = {2018},
}