In this project, we address a central challenge: making egocentric videos watchable. First-person videos are generally long-running, unedited streams, which makes them boring and visually unpalatable. Efforts have been made to accelerate them while maintaining smoothness, since naive fast-forwarding amplifies the natural motion of the recorder’s body, making the video nauseating to watch. We tackle this challenge with adaptive frame sampling based on the semantic information extracted from the images.
Publications
[TPAMI 2023] Washington Ramos, Michel Silva, Edson Araujo, Victor Moura, Keller Oliveira, Leandro Soriano Marcolino, Erickson R. Nascimento. Text-Driven Video Acceleration: A Weakly-Supervised Reinforcement Learning Method, IEEE Transactions on Pattern Analysis and Machine Intelligence (TPAMI), 2023. Visit the page for the code and paper access.
@article{Ramos2023tpami,
  author  = {Ramos, Washington and Silva, Michel and Araujo, Edson and Moura, Victor and Oliveira, Keller and Marcolino, Leandro Soriano and Nascimento, Erickson R.},
  title   = {Text-Driven Video Acceleration: A Weakly-Supervised Reinforcement Learning Method},
  journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence},
  year    = {2023},
  volume  = {45},
  number  = {2},
  pages   = {2492--2504},
  doi     = {10.1109/TPAMI.2022.3157198}
}
[SIBGRAPI 2021] Diognei de Matos, Washington Ramos, Luiz Romanhol, Erickson R. Nascimento. Musical Hyperlapse: A Multimodal Approach to Accelerate First-Person Videos, 2021 34th SIBGRAPI Conference on Graphics, Patterns and Images (SIBGRAPI), 2021. Visit the page for the code and paper access.
@inproceedings{Matos2021sibgrapi,
  author    = {de Matos, Diognei and Ramos, Washington and Romanhol, Luiz and Nascimento, Erickson R.},
  title     = {Musical Hyperlapse: A Multimodal Approach to Accelerate First-Person Videos},
  booktitle = {2021 34th SIBGRAPI Conference on Graphics, Patterns and Images (SIBGRAPI)},
  year      = {2021},
  pages     = {184--191},
  doi       = {10.1109/SIBGRAPI54419.2021.00033}
}
[TPAMI 2021] Michel M. Silva, Washington L. S. Ramos, Mario F. M. Campos, Erickson R. Nascimento. A Sparse Sampling-based framework for Semantic Fast-Forward of First-Person Videos, IEEE Transactions on Pattern Analysis and Machine Intelligence (TPAMI), 2021. Visit the page for the code and paper access.
@article{Silva2021tpami,
  author  = {Silva, Michel M. and Ramos, Washington L. S. and Campos, Mario F. M. and Nascimento, Erickson R.},
  title   = {A Sparse Sampling-based framework for Semantic Fast-Forward of First-Person Videos},
  journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence},
  year    = {2021},
  volume  = {43},
  number  = {4},
  pages   = {1438--1444},
  doi     = {10.1109/TPAMI.2020.2983929},
  issn    = {0162-8828}
}
[CVPRW 2020] Alan Neves, Michel Silva, Mario Campos, Erickson R. Nascimento. A gaze driven fast-forward method for first-person videos, Sixth International Workshop on Egocentric Perception, Interaction and Computing at the IEEE/CVF Conference on Computer Vision and Pattern Recognition (EPIC@CVPR), 2020. Visit the page for the code and paper access.
@inproceedings{Neves2020epic@cvpr,
  author    = {Neves, Alan and Silva, Michel and Campos, Mario and Nascimento, Erickson R.},
  title     = {A gaze driven fast-forward method for first-person videos},
  booktitle = {Sixth International Workshop on Egocentric Perception, Interaction and Computing at the IEEE/CVF Conference on Computer Vision and Pattern Recognition (EPIC@CVPR)},
  year      = {2020},
  month     = jun,
  pages     = {1--4}
}
[CVPR 2020] Washington L. S. Ramos, Michel M. Silva, Edson R. Araujo, Leandro S. Marcolino, Erickson R. Nascimento. Straight to the Point: Fast-forwarding Videos via Reinforcement Learning Using Textual Data, IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR), 2020. Visit the page for the code and paper access.
@inproceedings{Ramos2020cvpr,
  author    = {Ramos, Washington L. S. and Silva, Michel M. and Araujo, Edson R. and Marcolino, Leandro S. and Nascimento, Erickson R.},
  title     = {Straight to the Point: Fast-Forwarding Videos via Reinforcement Learning Using Textual Data},
  booktitle = {2020 IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  year      = {2020},
  pages     = {10928--10937}
}
[WACV 2020] Washington L. S. Ramos, Michel M. Silva, Edson R. Araujo, Alan C. Neves, Erickson R. Nascimento. Personalizing Fast-Forward Videos Based on Visual and Textual Features from Social Network, IEEE Winter Conference on Applications of Computer Vision (WACV), 2020. Visit the page for the code and paper access.
@inproceedings{Ramos2020WACV,
  author    = {Ramos, Washington L. S. and Silva, Michel M. and Araujo, Edson R. and Neves, Alan C. and Nascimento, Erickson R.},
  title     = {Personalizing Fast-Forward Videos Based on Visual and Textual Features from Social Network},
  booktitle = {2020 IEEE Winter Conference on Applications of Computer Vision (WACV)},
  year      = {2020},
  pages     = {3260--3269}
}
[CVPRW 2018] Vinicius S. Furlan, Ruzena Bajcsy, Erickson R. Nascimento. Fast forwarding Egocentric Videos by Listening and Watching, IEEE Conference on Computer Vision and Pattern Recognition Sight and Sound Workshop (CVPRW), 2018. Visit the page for more information.
@inproceedings{furlan2018cvprw,
  author    = {Furlan, Vinicius S. and Bajcsy, Ruzena and Nascimento, Erickson R.},
  title     = {Fast forwarding Egocentric Videos by Listening and Watching},
  booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR) Workshop on Sight and Sound},
  pages     = {2504--2507},
  publisher = {{IEEE} Computer Society},
  year      = {2018}
}
[JVCI 2018] Michel M. Silva, Washington L. S. Ramos, Felipe C. Chamone, Joao P. K. Ferreira, Mario F. M. Campos, Erickson R. Nascimento. Making a long story short: A Multi-Importance fast-forwarding egocentric videos with the emphasis on relevant objects, Journal of Visual Communication and Image Representation (JVCI), 2018. Visit the page for more information and paper access.
@article{Silva2018,
  author  = {Silva, Michel M. and Ramos, Washington L. S. and Chamone, Felipe C. and Ferreira, Jo{\~a}o P. K. and Campos, Mario F. M. and Nascimento, Erickson R.},
  title   = {Making a long story short: A Multi-Importance fast-forwarding egocentric videos with the emphasis on relevant objects},
  journal = {Journal of Visual Communication and Image Representation},
  year    = {2018},
  volume  = {53},
  pages   = {55--64},
  issn    = {1047-3203},
  doi     = {10.1016/j.jvcir.2018.02.013}
}
[CVPR 2018] Michel M. Silva, Washington L. S. Ramos, Joao P. K. Ferreira, Felipe C. Chamone, Mario F. M. Campos, Erickson R. Nascimento. A Weighted Sparse Sampling and Smoothing Frame Transition Approach for Semantic Fast-Forward First-Person Videos, IEEE Conference on Computer Vision and Pattern Recognition (CVPR), 2018. Visit the page for more information and paper access.
@inproceedings{Silva2018cvpr,
  author    = {Silva, Michel and Ramos, Washington and Ferreira, Jo{\~a}o and Chamone, Felipe and Campos, Mario and Nascimento, Erickson R.},
  title     = {A Weighted Sparse Sampling and Smoothing Frame Transition Approach for Semantic Fast-Forward First-Person Videos},
  booktitle = {2018 IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  year      = {2018},
  month     = jun,
  address   = {Salt Lake City, USA},
  pages     = {2383--2392},
  doi       = {10.1109/CVPR.2018.00253},
  isbn      = {978-1-5386-6420-9}
}
[EPIC 2016] Michel M. Silva, Washington L. S. Ramos, Joao P. K. Ferreira, Mario F. M. Campos, Erickson R. Nascimento. Towards Semantic Fast-Forward and Stabilized Egocentric Videos, First International Workshop on Egocentric Perception, Interaction, and Computing at European Conference on Computer Vision (EPIC@ECCV), 2016. Visit the page for the code and paper access.
@inproceedings{Silva2016,
  author    = {Silva, Michel Melo and Ramos, Washington Luis Souza and Ferreira, Joao Pedro Klock and Campos, Mario Fernando Montenegro and Nascimento, Erickson Rangel},
  title     = {Towards Semantic Fast-Forward and Stabilized Egocentric Videos},
  booktitle = {International Workshop on Egocentric Perception, Interaction and Computing (EPIC) at European Conference on Computer Vision (ECCV)},
  year      = {2016},
  month     = oct,
  address   = {Amsterdam, NL},
  pages     = {557--571},
  doi       = {10.1007/978-3-319-46604-0_40},
  isbn      = {978-3-319-46604-0}
}
[ICIP 2016] Washington L. S. Ramos, Michel M. Silva, Mario F. M. Campos, Erickson R. Nascimento. Fast-Forward Video Based on Semantic Extraction, IEEE International Conference on Image Processing (ICIP), 2016. Visit the page for the code and paper access.
@inproceedings{Ramos2016,
  author    = {Ramos, Washington L. S. and Silva, Michel M. and Campos, Mario F. M. and Nascimento, Erickson R.},
  title     = {Fast-Forward Video Based on Semantic Extraction},
  booktitle = {IEEE International Conference on Image Processing (ICIP)},
  year      = {2016},
  month     = sep,
  address   = {Phoenix, USA},
  pages     = {3334--3338},
  doi       = {10.1109/ICIP.2016.7532977}
}