I received a PhD degree in Mathematics and Computer Science in 2017 from the University of Catania advised by Prof. Giovanni Maria Farinella and Prof. Sebastiano Battiato, and spent time as a visiting researcher at the University of Texas at Austin advised by Prof. Kristen Grauman and at the University of Bristol advised by Prof. Dima Damen.
I teach a Bachelor course on Computer Programming and a Master course on Fundamentals of Data Analysis for which I proudly share open source notes here. I supervised more than 30 bachelor and master theses and supervised/currently supervising 8 PhD students.
I am passionate about making things work, understanding what great minds have discovered in the past and are discovering in the present, and humbly contributing to shaping the technology of the future.
My research focuses on understanding human activity and future intent from egocentric video, and building assistive systems which can support and empower humans. See this page for selected research highlights and this page for the full list of publications.
Lorenzo Mur-Labadia, Ruben Martinez-Cantin, Josechu Guerrero, Giovanni Maria Farinella, Antonino Furnari. AFF-ttention! Affordances and Attention models for Short-Term Object Interaction Anticipation. [Paper]
Camillo Quattrocchi, Antonino Furnari, Daniele Di Mauro, Mario Valerio Giuffrida, Giovanni Maria Farinella. Synchronization is All You Need: Exocentric-to-Egocentric Transfer for Temporal Action Segmentation with Unlabeled Synchronized Video Pairs. [Paper]
Rosario Leonardi, Antonino Furnari, Francesco Ragusa, Giovanni Maria Farinella. Are Synthetic Data Useful for Egocentric Hand-Object Interaction Detection? [Paper]
Jun 2024
We are among winners of two challenges at the EgoVis workshop:
🥇 1st place at the EgoVis HoloLens Mistake Detection Challenge with a solution based on gaze analysis detailed here.
Three papers accepted at CVPR 2024! (1 oral + 2 posters):
Alessandro Flaborea, Guido Maria D'Amely di Melendugno, Leonardo Plini, Luca Scofano, Edoardo De Matteis, Antonino Furnari, Giovanni Maria Farinella, Fabio Galasso. PREGO: online mistake detection in PRocedural EGOcentric videos[Paper]
Ivan Rodin, Antonino Furnari, Kyle Min, Subarna Tripathi, Giovanni Maria Farinella. Action Scene Graphs for Long-Form Understanding of Egocentric Videos. [Paper]
Ego-Exo4D: Understanding Skilled Human Activity from First- and Third-Person Perspectives. With other 100 authors! Oral < 1% accept rate.[Paper]
Short list of selected research projects. Click here for a full list. Click here for the full list of publications.
% Advances in Neural Information Processing Systems, 2024: differentiable task graph learning.
@inproceedings{seminara2024differentiable,
  author    = {Seminara, Luigi and Farinella, Giovanni Maria and Furnari, Antonino},
  title     = {Differentiable Task Graph Learning: Procedural Activity Representation and Online Mistake Detection from Egocentric Videos},
  booktitle = {Advances in Neural Information Processing Systems},
  year      = {2024},
  url       = {https://github.com/fpv-iplab/Differentiable-Task-Graph-Learning},
  pdf       = {https://arxiv.org/pdf/2406.01486.pdf},
}
% ECCV 2024: affordances and attention for short-term object interaction anticipation.
@inproceedings{mur-labadia2024AFF-ttention,
  author    = {Lorenzo Mur-Labadia and Ruben Martinez-Cantin and Josechu Guerrero and Giovanni Maria Farinella and Antonino Furnari},
  title     = {AFF-ttention! Affordances and Attention models for Short-Term Object Interaction Anticipation},
  booktitle = {European Conference on Computer Vision (ECCV)},
  year      = {2024},
  url       = {https://github.com/lmur98/AFFttention},
  pdf       = {https://arxiv.org/pdf/2406.01194.pdf},
}
% ECCV 2024: exocentric-to-egocentric transfer for temporal action segmentation.
% Authors use the "Last, First" form so that the two-word surname "Di Mauro"
% is not split into given name "Daniele Di" and surname "Mauro".
@inproceedings{quattrocchi2024synchronization,
  author    = {Quattrocchi, Camillo and Furnari, Antonino and Di Mauro, Daniele and Giuffrida, Mario Valerio and Farinella, Giovanni Maria},
  title     = {Synchronization is All You Need: Exocentric-to-Egocentric Transfer for Temporal Action Segmentation with Unlabeled Synchronized Video Pairs},
  booktitle = {European Conference on Computer Vision (ECCV)},
  year      = {2024},
  url       = {https://github.com/fpv-iplab/synchronization-is-all-you-need},
  pdf       = {https://arxiv.org/pdf/2312.02638.pdf},
}
% ECCV 2024: synthetic data for egocentric hand-object interaction detection.
@inproceedings{leonardi2024synthetic,
  author    = {Rosario Leonardi and Antonino Furnari and Francesco Ragusa and Giovanni Maria Farinella},
  title     = {Are Synthetic Data Useful for Egocentric Hand-Object Interaction Detection?},
  booktitle = {European Conference on Computer Vision (ECCV)},
  year      = {2024},
  url       = {https://github.com/fpv-iplab/HOI-Synth},
  pdf       = {https://arxiv.org/pdf/2312.02672.pdf},
}
% CVPR 2024: online mistake detection in procedural egocentric videos.
% Authors use the "Last, First" form so that the compound surnames
% "D'Amely di Melendugno" and "De Matteis" are parsed as single surnames.
@inproceedings{flaborea2024PREGO,
  author    = {Flaborea, Alessandro and D'Amely di Melendugno, Guido Maria and Plini, Leonardo and Scofano, Luca and De Matteis, Edoardo and Furnari, Antonino and Farinella, Giovanni Maria and Galasso, Fabio},
  title     = {PREGO: online mistake detection in PRocedural EGOcentric videos},
  booktitle = {Conference on Computer Vision and Pattern Recognition (CVPR)},
  year      = {2024},
  url       = {https://github.com/aleflabo/PREGO},
  pdf       = {https://arxiv.org/pdf/2404.01933.pdf},
}
% CVPR 2024: the Ego-Exo4D dataset paper (large multi-institution author list).
@inproceedings{grauman2023egoexo4d,
  author        = {Kristen Grauman and Andrew Westbury and Lorenzo Torresani and Kris Kitani
                   and Jitendra Malik and Triantafyllos Afouras and Kumar Ashutosh and Vijay Baiyya
                   and Siddhant Bansal and Bikram Boote and Eugene Byrne and Zach Chavis
                   and Joya Chen and Feng Cheng and Fu-Jen Chu and Sean Crane
                   and Avijit Dasgupta and Jing Dong and Maria Escobar and Cristhian Forigua
                   and Abrham Gebreselasie and Sanjay Haresh and Jing Huang and Md Mohaiminul Islam
                   and Suyog Jain and Rawal Khirodkar and Devansh Kukreja and Kevin J Liang
                   and Jia-Wei Liu and Sagnik Majumder and Yongsen Mao and Miguel Martin
                   and Effrosyni Mavroudi and Tushar Nagarajan and Francesco Ragusa and Santhosh Kumar Ramakrishnan
                   and Luigi Seminara and Arjun Somayazulu and Yale Song and Shan Su
                   and Zihui Xue and Edward Zhang and Jinxu Zhang and Angela Castillo
                   and Changan Chen and Xinzhu Fu and Ryosuke Furuta and Cristina Gonzalez
                   and Prince Gupta and Jiabo Hu and Yifei Huang and Yiming Huang
                   and Weslie Khoo and Anush Kumar and Robert Kuo and Sach Lakhavani
                   and Miao Liu and Mi Luo and Zhengyi Luo and Brighid Meredith
                   and Austin Miller and Oluwatumininu Oguntola and Xiaqing Pan and Penny Peng
                   and Shraman Pramanick and Merey Ramazanova and Fiona Ryan and Wei Shan
                   and Kiran Somasundaram and Chenan Song and Audrey Southerland and Masatoshi Tateno
                   and Huiyu Wang and Yuchen Wang and Takuma Yagi and Mingfei Yan
                   and Xitong Yang and Zecheng Yu and Shengxin Cindy Zha and Chen Zhao
                   and Ziwei Zhao and Zhifan Zhu and Jeff Zhuo and Pablo Arbelaez
                   and Gedas Bertasius and David Crandall and Dima Damen and Jakob Engel
                   and Giovanni Maria Farinella and Antonino Furnari and Bernard Ghanem and Judy Hoffman
                   and C. V. Jawahar and Richard Newcombe and Hyun Soo Park and James M. Rehg
                   and Yoichi Sato and Manolis Savva and Jianbo Shi and Mike Zheng Shou
                   and Michael Wray},
  title         = {Ego-Exo4D: Understanding Skilled Human Activity from First- and Third-Person Perspectives},
  booktitle     = {Conference on Computer Vision and Pattern Recognition (CVPR)},
  year          = {2024},
  url           = {https://ego-exo4d-data.org/},
  pdf           = {https://arxiv.org/pdf/2311.18259.pdf},
  eprint        = {2311.18259},
  archiveprefix = {arXiv},
  primaryclass  = {cs.CV},
}
% CVPR 2024: egocentric action scene graphs for long-form video understanding.
@inproceedings{rodin2023action,
  author        = {Ivan Rodin and Antonino Furnari and Kyle Min and Subarna Tripathi and Giovanni Maria Farinella},
  title         = {Action Scene Graphs for Long-Form Understanding of Egocentric Videos},
  booktitle     = {Conference on Computer Vision and Pattern Recognition (CVPR)},
  year          = {2024},
  url           = {https://github.com/fpv-iplab/EASG},
  pdf           = {https://arxiv.org/pdf/2312.03391.pdf},
  eprint        = {2312.03391},
  archiveprefix = {arXiv},
  primaryclass  = {cs.CV},
}
% IJCV 2024 survey on the future of egocentric vision.
% The doi is stored bare (no resolver prefix); it is the one embedded in the url.
@article{Plizzari2024AnOutlook,
  author  = {Chiara Plizzari and Gabriele Goletto and Antonino Furnari and Siddhant Bansal and Francesco Ragusa and Giovanni Maria Farinella and Dima Damen and Tatiana Tommasi},
  title   = {An Outlook into the Future of Egocentric Vision},
  journal = {International Journal of Computer Vision (IJCV)},
  year    = {2024},
  doi     = {10.1007/s11263-024-02095-7},
  url     = {https://link.springer.com/article/10.1007/s11263-024-02095-7},
  pdf     = {https://link.springer.com/content/pdf/10.1007/s11263-024-02095-7.pdf},
}
% CVPR Workshops 2023: StillFast, end-to-end short-term object interaction anticipation.
@inproceedings{ragusa2023stillfast,
  author    = {Francesco Ragusa and Giovanni Maria Farinella and Antonino Furnari},
  title     = {StillFast: An End-to-End Approach for Short-Term Object Interaction Anticipation},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) Workshops},
  year      = {2023},
  url       = {https://iplab.dmi.unict.it/stillfast/},
  pdf       = {https://arxiv.org/pdf/2304.03959.pdf},
}
% IJCV 2022 (vol. 130): the EPIC-KITCHENS-100 dataset paper.
% Journal name matches the other IJCV entry in this file; page range uses "--".
@article{Damen2021rescaling,
  author  = {Damen, Dima and Doughty, Hazel and Farinella, Giovanni Maria and Furnari, Antonino and Kazakos, Evangelos and Ma, Jian and Moltisanti, Davide and Munro, Jonathan and Perrett, Toby and Price, Will and Wray, Michael},
  title   = {Rescaling Egocentric Vision: Collection, Pipeline and Challenges for EPIC-KITCHENS-100},
  journal = {International Journal of Computer Vision (IJCV)},
  volume  = {130},
  pages   = {33--55},
  year    = {2022},
  url     = {http://epic-kitchens.github.io/2020-100},
  pdf     = {http://arxiv.org/pdf/2006.13256.pdf},
}
% CVPR 2022: the Ego4D dataset paper (large multi-institution author list).
% The booktitle drops the spurious "International" (CVPR is a "Conference on
% Computer Vision and Pattern Recognition"); title words whose capitals must
% survive sentence-casing are braced as whole words.
@inproceedings{grauman2022around,
  author    = {Kristen Grauman and Andrew Westbury and Eugene Byrne and Zachary Chavis
               and Antonino Furnari and Rohit Girdhar and Jackson Hamburger and Hao Jiang
               and Miao Liu and Xingyu Liu and Miguel Martin and Tushar Nagarajan
               and Ilija Radosavovic and Santhosh Kumar Ramakrishnan and Fiona Ryan and Jayant Sharma
               and Michael Wray and Mengmeng Xu and Eric Zhongcong Xu and Chen Zhao
               and Siddhant Bansal and Dhruv Batra and Vincent Cartillier and Sean Crane
               and Tien Do and Morrie Doulaty and Akshay Erapalli and Christoph Feichtenhofer
               and Adriano Fragomeni and Qichen Fu and Christian Fuegen and Abrham Gebreselasie
               and Cristina Gonzalez and James Hillis and Xuhua Huang and Yifei Huang
               and Wenqi Jia and Weslie Khoo and Jachym Kolar and Satwik Kottur
               and Anurag Kumar and Federico Landini and Chao Li and Yanghao Li
               and Zhenqiang Li and Karttikeya Mangalam and Raghava Modhugu and Jonathan Munro
               and Tullie Murrell and Takumi Nishiyasu and Will Price and Paola Ruiz Puentes
               and Merey Ramazanova and Leda Sari and Kiran Somasundaram and Audrey Southerland
               and Yusuke Sugano and Ruijie Tao and Minh Vo and Yuchen Wang
               and Xindi Wu and Takuma Yagi and Yunyi Zhu and Pablo Arbelaez
               and David Crandall and Dima Damen and Giovanni Maria Farinella and Bernard Ghanem
               and Vamsi Krishna Ithapu and C. V. Jawahar and Hanbyul Joo and Kris Kitani
               and Haizhou Li and Richard Newcombe and Aude Oliva and Hyun Soo Park
               and James M. Rehg and Yoichi Sato and Jianbo Shi and Mike Zheng Shou
               and Antonio Torralba and Lorenzo Torresani and Mingfei Yan and Jitendra Malik},
  title     = {Around the {World} in 3,000 {Hours} of {Egocentric} {Video}},
  booktitle = {IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  year      = {2022},
  url       = {https://ego4d-data.org/},
  pdf       = {https://arxiv.org/pdf/2110.07058.pdf},
}
% WACV 2021: the MECCANO dataset (conference version).
% Venue spelled "Applications of Computer Vision"; archiveprefix added so the
% eprint/primaryclass pair identifies an arXiv record, as in the other entries.
@inproceedings{ragusa2021meccano,
  author        = {Francesco Ragusa and Antonino Furnari and Salvatore Livatino and Giovanni Maria Farinella},
  title         = {The MECCANO Dataset: Understanding Human-Object Interactions from Egocentric Videos in an Industrial-like Domain},
  booktitle     = {IEEE Winter Conference on Applications of Computer Vision (WACV)},
  year          = {2021},
  url           = {https://iplab.dmi.unict.it/MECCANO},
  pdf           = {https://arxiv.org/pdf/2010.05654.pdf},
  eprint        = {2010.05654},
  archiveprefix = {arXiv},
  primaryclass  = {cs.CV},
}
% CVIU 2023: the MECCANO dataset (journal version).
% pdf and eprint are derived from the arXiv identifier already present in url,
% so this entry exposes a paper link like the other entries in the file.
@article{ragusa2023meccano,
  author        = {Francesco Ragusa and Antonino Furnari and Giovanni Maria Farinella},
  title         = {MECCANO: A Multimodal Egocentric Dataset for Humans Behavior Understanding in the Industrial-like Domain},
  journal       = {Computer Vision and Image Understanding (CVIU)},
  year          = {2023},
  url           = {https://arxiv.org/abs/2209.08691},
  pdf           = {https://arxiv.org/pdf/2209.08691.pdf},
  eprint        = {2209.08691},
  archiveprefix = {arXiv},
}
% CVIU 2021 (vol. 211): survey on predicting the future from egocentric vision.
% The doi is stored bare (no resolver prefix); the journal label matches the
% other CVIU entries in this file.
% NOTE(review): third author's surname corrected to "Mavroeidis" - confirm against the published paper.
@article{rodin2021predicting,
  author  = {Ivan Rodin and Antonino Furnari and Dimitrios Mavroeidis and Giovanni Maria Farinella},
  title   = {Predicting the Future from First Person (Egocentric) Vision: A Survey},
  journal = {Computer Vision and Image Understanding (CVIU)},
  volume  = {211},
  pages   = {103252},
  year    = {2021},
  issn    = {1077-3142},
  doi     = {10.1016/j.cviu.2021.103252},
  url     = {https://www.sciencedirect.com/science/article/pii/S1077314221000965},
  pdf     = {https://arxiv.org/pdf/2107.13411.pdf},
}
% ICPR 2022: streaming egocentric action anticipation (conference version).
@inproceedings{furnari2022towards,
  author    = {Antonino Furnari and Giovanni Maria Farinella},
  title     = {Towards Streaming Egocentric Action Anticipation},
  booktitle = {International Conference on Pattern Recognition (ICPR)},
  year      = {2022},
  pdf       = {https://arxiv.org/pdf/2110.05386.pdf},
}
% CVIU 2023: streaming egocentric action anticipation (journal version).
% The doi is stored bare; the url drops the "via" tracking query, whose raw
% percent sign is also unsafe in classic BibTeX output.
@article{furnari2023streaming,
  author  = {Antonino Furnari and Giovanni Maria Farinella},
  title   = {Streaming egocentric action anticipation: an evaluation scheme and approach},
  journal = {Computer Vision and Image Understanding (CVIU)},
  year    = {2023},
  doi     = {10.1016/j.cviu.2023.103763},
  url     = {https://www.sciencedirect.com/science/article/pii/S1077314223001431},
  pdf     = {https://arxiv.org/pdf/2306.16682.pdf},
}
% PAMI 2020: the EPIC-KITCHENS dataset (journal version).
@article{damen2020epic,
  author  = {Dima Damen and Hazel Doughty and Giovanni Maria Farinella and Sanja Fidler and Antonino Furnari and Evangelos Kazakos and Davide Moltisanti and Jonathan Munro and Toby Perrett and Will Price and Michael Wray},
  title   = {The EPIC-KITCHENS Dataset: Collection, Challenges and Baselines},
  journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence (PAMI)},
  year    = {2020},
  doi     = {10.1109/TPAMI.2020.2991965},
  url     = {https://epic-kitchens.github.io/},
  pdf     = {https://arxiv.org/pdf/2005.00343.pdf},
}
% ECCV 2018: the EPIC-KITCHENS dataset (conference version).
% Given names are stored in full (same author list as damen2020epic) so the
% bibliography style decides abbreviation; the venue carries the ECCV acronym
% like the other ECCV entries.
@inproceedings{Damen2018EPICKITCHENS,
  author    = {Dima Damen and Hazel Doughty and Giovanni Maria Farinella and Sanja Fidler and Antonino Furnari and Evangelos Kazakos and Davide Moltisanti and Jonathan Munro and Toby Perrett and Will Price and Michael Wray},
  title     = {Scaling Egocentric Vision: The EPIC-KITCHENS Dataset},
  booktitle = {European Conference on Computer Vision (ECCV)},
  year      = {2018},
  url       = {https://epic-kitchens.github.io/2018},
  pdf       = {https://arxiv.org/pdf/1804.02748.pdf},
}
% Pattern Recognition Letters 2020 (cultural heritage special issue): the EGO-CH dataset.
% Given names are stored in full, as spelled in the other entries of this file.
@article{ragusa2020egoch,
  author  = {Francesco Ragusa and Antonino Furnari and Sebastiano Battiato and Giovanni Signorello and Giovanni Maria Farinella},
  title   = {EGO-CH: Dataset and Fundamental Tasks for Visitors Behavioral Understanding using Egocentric Vision},
  journal = {Pattern Recognition Letters - Special Issue on Pattern Recognition and Artificial Intelligence Techniques for Cultural Heritage},
  year    = {2020},
  url     = {https://iplab.dmi.unict.it/EGO-CH/},
  pdf     = {https://www.antoninofurnari.it/downloads/publications/ragusa2020egoch.pdf},
}
% Pattern Recognition Letters 2020 (cultural heritage special issue):
% visitor localization and artwork detection with synthetic data.
% Title typo fixed: "inCultural" is now "in Cultural".
@article{orlando2020egocentric,
  author  = {S. Orlando and A. Furnari and G. M. Farinella},
  title   = {Egocentric Visitor Localization and Artwork Detection in Cultural Sites Using Synthetic Data},
  journal = {Pattern Recognition Letters - Special Issue on Pattern Recognition and Artificial Intelligence Techniques for Cultural Heritage},
  year    = {2020},
  url     = {https://iplab.dmi.unict.it/SimulatedEgocentricNavigations/},
  pdf     = {https://www.antoninofurnari.it/downloads/publications/orlando2020egocentric.pdf},
}
% JVCI 2019: egocentric visitor localization in natural sites.
% The doi is stored bare; initials are space-separated so each is parsed as
% its own name token; "Giovanni Maria Farinella" matches the rest of the file.
@article{milotta2019egocentric,
  author  = {Filippo L. M. Milotta and Antonino Furnari and Sebastiano Battiato and Giovanni Signorello and Giovanni Maria Farinella},
  title   = {Egocentric Visitors Localization in Natural Sites},
  journal = {Journal of Visual Communication and Image Representation},
  pages   = {102664},
  year    = {2019},
  issn    = {1047-3203},
  doi     = {10.1016/j.jvcir.2019.102664},
  url     = {https://iplab.dmi.unict.it/EgoNature/},
  pdf     = {https://www.antoninofurnari.it/downloads/publications/milotta2019egocentric.pdf},
}
% JOCCH 2019 (vol. 12, no. 2): egocentric visitor localization in cultural sites.
% The issue is stored in the standard "number" field, the doi is bare, and
% given names are written in full as in the other entries of this file.
@article{ragusa2019egocentric,
  author  = {Francesco Ragusa and Antonino Furnari and Sebastiano Battiato and Giovanni Signorello and Giovanni Maria Farinella},
  title   = {Egocentric Visitors Localization in Cultural Sites},
  journal = {Journal on Computing and Cultural Heritage (JOCCH)},
  volume  = {12},
  number  = {2},
  year    = {2019},
  doi     = {10.1145/3276772},
  url     = {http://iplab.dmi.unict.it/VEDI/},
  pdf     = {https://arxiv.org/pdf/1904.05264.pdf},
}
% PAMI 2020: Rolling-Unrolling LSTMs for action anticipation (journal version).
@article{furnari2020rulstm,
  author  = {Antonino Furnari and Giovanni Maria Farinella},
  title   = {Rolling-Unrolling LSTMs for Action Anticipation from First-Person Video},
  journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence (PAMI)},
  year    = {2020},
  doi     = {10.1109/TPAMI.2020.2992889},
  url     = {https://iplab.dmi.unict.it/rulstm},
  pdf     = {https://arxiv.org/pdf/2005.02190.pdf},
}
% ICCV 2019: Rolling-Unrolling LSTMs with modality attention (conference version).
% The project url uses https, matching furnari2020rulstm, and the venue carries
% its acronym like the other conference entries.
@inproceedings{furnari2019rulstm,
  author    = {Antonino Furnari and Giovanni Maria Farinella},
  title     = {What Would You Expect? Anticipating Egocentric Actions with Rolling-Unrolling LSTMs and Modality Attention},
  booktitle = {International Conference on Computer Vision (ICCV)},
  year      = {2019},
  url       = {https://iplab.dmi.unict.it/rulstm},
  pdf       = {https://arxiv.org/pdf/1905.09035.pdf},
}
% EPIC workshop at ECCV 2018: uncertainty-aware losses for egocentric action anticipation.
% Given names are stored in full, as spelled in the other entries of this file.
@inproceedings{furnari2018Leveraging,
  author    = {Antonino Furnari and Sebastiano Battiato and Giovanni Maria Farinella},
  title     = {Leveraging Uncertainty to Rethink Loss Functions and Evaluation Measures for Egocentric Action Anticipation},
  booktitle = {International Workshop on Egocentric Perception, Interaction and Computing (EPIC) in conjunction with ECCV},
  year      = {2018},
  url       = {https://github.com/fpv-iplab/action-anticipation-losses/},
  pdf       = {../publications/furnari2018Leveraging.pdf},
}
% JVCI 2017 (vol. 49): next-active-object prediction from egocentric videos.
% The non-numeric "Supplement C" issue value (an export artifact) is dropped,
% the page range uses "--", and the doi is stored bare.
@article{furnari2017next,
  author  = {Antonino Furnari and Sebastiano Battiato and Kristen Grauman and Giovanni Maria Farinella},
  title   = {Next-active-object prediction from egocentric videos},
  journal = {Journal of Visual Communication and Image Representation},
  volume  = {49},
  pages   = {401--411},
  year    = {2017},
  issn    = {1047-3203},
  doi     = {10.1016/j.jvcir.2017.10.004},
  url     = {http://iplab.dmi.unict.it/NextActiveObjectPrediction/},
  pdf     = {https://www.antoninofurnari.it/downloads/publications/furnari2017next.pdf},
}
% JVCI 2018 (vol. 52): personal-location-based temporal segmentation of egocentric video.
% The page range uses "--" and the doi is stored bare.
@article{furnari2018personal,
  author  = {Antonino Furnari and Sebastiano Battiato and Giovanni Maria Farinella},
  title   = {Personal-Location-Based Temporal Segmentation of Egocentric Video for Lifelogging Applications},
  journal = {Journal of Visual Communication and Image Representation},
  volume  = {52},
  pages   = {1--12},
  year    = {2018},
  issn    = {1047-3203},
  doi     = {10.1016/j.jvcir.2018.01.019},
  url     = {http://iplab.dmi.unict.it/PersonalLocationSegmentation/},
  pdf     = {../publications/furnari2018personal.pdf},
}
% EPIC workshop at ECCV 2016 (LNCS vol. 9913): temporal segmentation of egocentric videos.
% publisher holds only the publisher name; the series name lives in the series field.
@inproceedings{furnari2016temporal,
  author    = {Antonino Furnari and Giovanni Maria Farinella and Sebastiano Battiato},
  title     = {Temporal Segmentation of Egocentric Videos to Highlight Personal Locations of Interest},
  booktitle = {International Workshop on Egocentric Perception, Interaction and Computing (EPIC) in conjunction with ECCV, The Netherlands, Amsterdam, October 9},
  series    = {Lecture Notes in Computer Science},
  volume    = {9913},
  pages     = {474--489},
  publisher = {Springer},
  year      = {2016},
  url       = {http://iplab.dmi.unict.it/PersonalLocationSegmentation/},
  pdf       = {../publications/furnari2016temporal.pdf},
}
% IEEE Transactions on Human-Machine Systems, 2016: recognizing personal locations.
@article{furnari2016recognizing,
  author  = {Furnari, Antonino and Farinella, Giovanni Maria and Battiato, Sebastiano},
  title   = {Recognizing Personal Locations From Egocentric Videos},
  journal = {IEEE Transactions on Human-Machine Systems},
  year    = {2016},
  issn    = {2168-2291},
  doi     = {10.1109/THMS.2016.2612002},
  url     = {http://iplab.dmi.unict.it/PersonalLocations/},
  pdf     = {../publications/furnari2016recognizing.pdf},
}
% ACVR workshop at ICCV 2015: recognizing personal contexts from egocentric images.
% The page range is stored in the standard "pages" field; the misspelled
% "page" field is unknown to bibliography styles and was silently ignored.
@inproceedings{furnari2015recognizing,
  author    = {Antonino Furnari and Giovanni Maria Farinella and Sebastiano Battiato},
  title     = {Recognizing Personal Contexts from Egocentric Images},
  booktitle = {Workshop on Assistive Computer Vision and Robotics (ACVR) in conjunction with ICCV, Santiago, Chile, December 12},
  pages     = {393--401},
  year      = {2015},
  url       = {http://iplab.dmi.unict.it/PersonalLocations/},
  pdf       = {../publications/furnari2015recognizing.pdf},
}