Skip to main content
Menu

Publications

Showing 50 publications by João Henriques

A sound approach: using large language models to generate audio descriptions for egocentric text-audio retrieval

Oncescu A-M, Henriques JF, Zisserman A, Albanie S & Koepke AS (2024), Proceedings of the 49th IEEE International Conference on Acoustics, Speech, & Signal Processing (ICASSP 2024), 7300-7304

BibTeX View PDF
@inproceedings{asoundapproachu-2024/4,
  title={A sound approach: using large language models to generate audio descriptions for egocentric text-audio retrieval},
  author={Oncescu, A.-M. and Henriques, J. F. and Zisserman, A. and Albanie, S. and Koepke, A. S.},
  booktitle={49th {IEEE} International Conference on Acoustics, Speech, \& Signal Processing ({ICASSP} 2024)},
  pages={7300--7304},
  year={2024}
}

N2F2: Hierarchical Scene Understanding with Nested Neural Feature Fields

Bhalgat Y, Laina I, Henriques JF, Zisserman A & Vedaldi A (2024)

BibTeX View PDF
@misc{nfhierarchicals-2024/3,
  title={{N2F2}: Hierarchical Scene Understanding with Nested Neural Feature Fields},
  author={Bhalgat, Y. and Laina, I. and Henriques, J. F. and Zisserman, A. and Vedaldi, A.},
  year={2024}
}

SCENES: Subpixel Correspondence Estimation With Epipolar Supervision

Kloepfer DA, Henriques JF & Campbell D (2024), 00, 21-30

BibTeX View PDF
@inproceedings{scenessubpixelc-2024/3,
  title={{SCENES}: Subpixel Correspondence Estimation With Epipolar Supervision},
  author={Kloepfer, D. A. and Henriques, J. F. and Campbell, D.},
  booktitle={2024 International Conference on {3D} Vision ({3DV})},
  pages={21--30},
  year={2024}
}

Select to perfect: imitating desired behavior from large multi-agent data

Franzmeyer T, Elkind E, Torr P, Foerster J & Henriques JF (2024), Proceedings of the 12th International Conference on Learning Representations (ICLR 2024)

BibTeX
@inproceedings{selecttoperfect-2024/1,
  title={Select to perfect: imitating desired behavior from large multi-agent data},
  author={Franzmeyer, T. and Elkind, E. and Torr, P. and Foerster, J. and Henriques, J. F.},
  booktitle={12th International Conference on Learning Representations ({ICLR} 2024)},
  year={2024}
}

LoCUS: Learning Multiscale 3D-consistent Features from Posed Images

Kloepfer DA, Campbell D & Henriques JF (2023), 00, 16588-16598

BibTeX View PDF
@inproceedings{locuslearningmu-2023/10,
  title={{LoCUS}: Learning Multiscale {3D}-consistent Features from Posed Images},
  author={Kloepfer, D. A. and Campbell, D. and Henriques, J. F.},
  booktitle={2023 {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  pages={16588--16598},
  year={2023}
}

CASSPR: Cross Attention Single Scan Place Recognition

Xia Y, Gladkova M, Wang R, Li Q, Stilla U et al. (2023), 00, 8427-8438

BibTeX View PDF
@inproceedings{cassprcrossatte-2023/10,
  title={{CASSPR}: Cross Attention Single Scan Place Recognition},
  author={Xia, Y. and Gladkova, M. and Wang, R. and Li, Q. and Stilla, U. and others},
  booktitle={2023 {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  pages={8427--8438},
  year={2023}
}

RbA: Segmenting Unknown Regions Rejected by All

Nayal N, Yavuz M, Henriques JF & Güney F (2023), 00, 711-722

BibTeX View PDF
@inproceedings{rbasegmentingun-2023/10,
  title={{RbA}: Segmenting Unknown Regions Rejected by All},
  author={Nayal, N. and Yavuz, M. and Henriques, J. F. and G{\"u}ney, F.},
  booktitle={2023 {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  pages={711--722},
  year={2023}
}

A light touch approach to teaching transformers multi-view geometry

Bhalgat Y, Henriques J & Zisserman A (2023), Proceedings of the Conference on Computer Vision and Pattern Recognition (CVPR 2023), 4958-4969

BibTeX View PDF
@inproceedings{alighttouchappr-2023/8,
  title={A light touch approach to teaching transformers multi-view geometry},
  author={Bhalgat, Y. and Henriques, J. and Zisserman, A.},
  booktitle={Conference on Computer Vision and Pattern Recognition ({CVPR} 2023)},
  pages={4958--4969},
  year={2023}
}

Contrastive Lift: 3D Object Instance Segmentation by Slow-Fast Contrastive Fusion

Bhalgat Y, Laina I, Henriques JF, Zisserman A & Vedaldi A (2023)

BibTeX View PDF
@misc{contrastivelift-2023/6,
  title={Contrastive Lift: {3D} Object Instance Segmentation by Slow-Fast Contrastive Fusion},
  author={Bhalgat, Y. and Laina, I. and Henriques, J. F. and Zisserman, A. and Vedaldi, A.},
  year={2023}
}

Learn what matters: cross-domain imitation learning with task-relevant embeddings

Franzmeyer T, Torr P & Henriques J (2023), Advances in Neural Information Processing Systems 35 (NeurIPS 2022), 35

BibTeX
@inproceedings{learnwhatmatter-2023/4,
  title={Learn what matters: cross-domain imitation learning with task-relevant embeddings},
  author={Franzmeyer, T. and Torr, P. and Henriques, J.},
  booktitle={36th Annual Conference on Neural Information Processing Systems ({NeurIPS} 2022)},
  volume={35},
  year={2023}
}

Towards Solving Fuzzy Tasks with Human Feedback: A Retrospective of the MineRL BASALT 2022 Competition

Milani S, Kanervisto A, Ramanauskas K, Schulhoff S, Houghton B et al. (2023), Proceedings of Machine Learning Research, 220, 171-188

BibTeX
@inproceedings{towardssolvingf-2023/1,
  title={Towards Solving Fuzzy Tasks with Human Feedback: A Retrospective of the {MineRL} {BASALT} 2022 Competition},
  author={Milani, S. and Kanervisto, A. and Ramanauskas, K. and Schulhoff, S. and Houghton, B. and others},
  series={Proceedings of Machine Learning Research},
  volume={220},
  pages={171--188},
  year={2023}
}

SNeS: learning probably symmetric neural surfaces from incomplete data

Insafutdinov E, Campbell D & Vedaldi A (2022)

BibTeX View PDF
@inproceedings{sneslearningpro-2022/11,
  title={{SNeS}: learning probably symmetric neural surfaces from incomplete data},
  author={Insafutdinov, E. and Campbell, D. and Vedaldi, A.},
  booktitle={European Conference on Computer Vision 2022},
  year={2022}
}

RbA: Segmenting Unknown Regions Rejected by All

Nayal N, Yavuz M, Henriques JF & Güney F (2022)

BibTeX View PDF
@misc{rbasegmentingun-2022/11,
  title={{RbA}: Segmenting Unknown Regions Rejected by All},
  author={Nayal, N. and Yavuz, M. and Henriques, J. F. and G{\"u}ney, F.},
  year={2022}
}

Towards real-world navigation with deep differentiable planners

Ishida S & Henriques JF (2022), Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR 2022), 17306-17315

BibTeX View PDF
@inproceedings{towardsrealworl-2022/9,
  title={Towards real-world navigation with deep differentiable planners},
  author={Ishida, S. and Henriques, J. F.},
  booktitle={{IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR} 2022)},
  pages={17306--17315},
  year={2022}
}

Towards real-world navigation with deep differentiable planners

Ishida S & Henriques JF (2022), Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR 2022), 17306-17315

BibTeX View PDF
@inproceedings{towardsrealworl-2022/9,
  title={Towards real-world navigation with deep differentiable planners},
  author={Ishida, S. and Henriques, J. F.},
  booktitle={{IEEE/CVF} Conference on Computer Vision and Pattern Recognition ({CVPR} 2022)},
  pages={17306--17315},
  year={2022}
}

SNeS: Learning Probably Symmetric Neural Surfaces from Incomplete Data

Insafutdinov E, Campbell D, Henriques JF & Vedaldi A (2022)

BibTeX View PDF
@misc{sneslearningpro-2022/6,
  title={{SNeS}: Learning Probably Symmetric Neural Surfaces from Incomplete Data},
  author={Insafutdinov, E. and Campbell, D. and Henriques, J. F. and Vedaldi, A.},
  year={2022}
}

Learning altruistic behaviours in reinforcement learning without external rewards

Franzmeyer T, Malinowski M & Henriques JF (2022)

BibTeX
@inproceedings{learningaltruis-2022/4,
  title={Learning altruistic behaviours in reinforcement learning without external rewards},
  author={Franzmeyer, T. and Malinowski, M. and Henriques, J. F.},
  booktitle={10th International Conference on Learning Representations ({ICLR} 2022)},
  year={2022}
}

Learning altruistic behaviours in reinforcement learning without external rewards

Franzmeyer T, Malinowski M & Henriques JF (2022)

BibTeX
@inproceedings{learningaltruis-2022/4,
  title={Learning altruistic behaviours in reinforcement learning without external rewards},
  author={Franzmeyer, T. and Malinowski, M. and Henriques, J. F.},
  booktitle={10th International Conference on Learning Representations ({ICLR} 2022)},
  year={2022}
}

Space-Time Crop & Attend: improving cross-modal video representation learning

Patrick M, Huang P-Y, Misra I, Metze F, Vedaldi A et al. (2022), 2021 IEEE/CVF International Conference on Computer Vision (ICCV), 10540-10552

BibTeX View PDF
@inproceedings{spacetimecropat-2022/2,
  title={Space-Time Crop \& Attend: improving cross-modal video representation learning},
  author={Patrick, M. and Huang, P.-Y. and Misra, I. and Metze, F. and Vedaldi, A. and others},
  booktitle={2021 {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  pages={10540--10552},
  year={2022}
}

On compositions of transformations in contrastive self-supervised learning

Asano YM, Patrick M, Kuznetsova P, Fong R, Henriques J et al. (2022), Proceedings of the 2021 IEEE/CVF International Conference on Computer Vision (ICCV 2021), 9557-9567

BibTeX View PDF
@inproceedings{oncompositionso-2022/2,
  title={On compositions of transformations in contrastive self-supervised learning},
  author={Asano, Yuki M. and Patrick, M. and Kuznetsova, P. and Fong, R. and Henriques, J. and others},
  booktitle={2021 {IEEE/CVF} International Conference on Computer Vision ({ICCV} 2021)},
  pages={9557--9567},
  year={2022}
}

Preface

Albanie S, Henriques JF, Bertinetto L, Hernández-García A, Doughty H et al. (2022), Proceedings of Machine Learning Research, 181

BibTeX
@article{preface-2022/1,
  title={Preface},
  author={Albanie, S. and Henriques, J. F. and Bertinetto, L. and Hern{\'a}ndez-Garc{\'\i}a, A. and Doughty, H. and others},
  journal={Proceedings of Machine Learning Research},
  volume={181},
  year={2022}
}

Keeping your eye on the ball: Trajectory attention in video transformers

Patrick M, Campbell D, Asano Y, Misra I, Metze F et al. (2021), Advances in Neural Information Processing Systems 34, 34, 12493-12506

BibTeX
@inproceedings{keepingyoureyeo-2021/12,
  title={Keeping your eye on the ball: Trajectory attention in video transformers},
  author={Patrick, M. and Campbell, D. and Asano, Y. and Misra, I. and Metze, F. and others},
  booktitle={35th Conference on Neural Information Processing Systems ({NeurIPS} 2021)},
  volume={34},
  pages={12493--12506},
  year={2021}
}

Moving SLAM: fully unsupervised deep learning in non-rigid scenes

Xu D, Vedaldi A & Henriques JF (2021), Proceedings of the IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS 2021), 4611-4617

BibTeX View PDF
@inproceedings{movingslamfully-2021/9,
  title={Moving {SLAM}: fully unsupervised deep learning in non-rigid scenes},
  author={Xu, D. and Vedaldi, A. and Henriques, J. F.},
  booktitle={{IEEE/RSJ} International Conference on Intelligent Robots and Systems ({IROS} 2021)},
  pages={4611--4617},
  year={2021}
}

Audio retrieval with natural language queries

Oncescu A-M, Koepke AS, Henriques J, Akata Z & Albanie S (2021), Proceedings of Interspeech 2021, 2411-2415

BibTeX View PDF
@inproceedings{audioretrievalw-2021/8,
  title={Audio retrieval with natural language queries},
  author={Oncescu, A.-M. and Koepke, A. S. and Henriques, J. and Akata, Z. and Albanie, S.},
  booktitle={Interspeech 2021},
  pages={2411--2415},
  year={2021}
}

Keeping Your Eye on the Ball: Trajectory Attention in Video Transformers

Patrick M, Campbell D, Asano YM, Misra I, Metze F et al. (2021)

BibTeX View PDF
@misc{keepingyoureyeo-2021/6,
  title={Keeping Your Eye on the Ball: Trajectory Attention in Video Transformers},
  author={Patrick, M. and Campbell, D. and Asano, Y. M. and Misra, I. and Metze, F. and others},
  year={2021}
}

QUERYD: a video dataset with high-quality text and audio narrations

Oncescu A-M, Henriques J, Liu Y, Zisserman A & Albanie S (2021), ICASSP 2021 - 2021 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP), 2265-2269

BibTeX View PDF
@inproceedings{querydavideodat-2021/5,
  title={{QUERYD}: a video dataset with high-quality text and audio narrations},
  author={Oncescu, A.-M. and Henriques, J. and Liu, Y. and Zisserman, A. and Albanie, S.},
  booktitle={2021 {IEEE} International Conference on Acoustics, Speech and Signal Processing ({ICASSP} 2021)},
  pages={2265--2269},
  year={2021}
}

Support-set bottlenecks for video-text representation learning

Patrick M, Huang P, Asano Y, Metze F, Hauptmann A et al. (2021)

BibTeX
@inproceedings{supportsetbottl-2021/5,
  title={Support-set bottlenecks for video-text representation learning},
  author={Patrick, M. and Huang, P. and Asano, Y. and Metze, F. and Hauptmann, A. and others},
  booktitle={9th International Conference on Learning Representations ({ICLR} 2021)},
  year={2021}
}

Moving SLAM: Fully Unsupervised Deep Learning in Non-Rigid Scenes

Xu D, Vedaldi A & Henriques JF (2021)

BibTeX View PDF
@misc{movingslamfully-2021/5,
  title={Moving {SLAM}: Fully Unsupervised Deep Learning in Non-Rigid Scenes},
  author={Xu, D. and Vedaldi, A. and Henriques, J. F.},
  year={2021}
}

Space-Time Crop & Attend: Improving Cross-modal Video Representation Learning

Patrick M, Asano YM, Huang B, Misra I, Metze F et al. (2021)

BibTeX View PDF
@misc{spacetimecropat-2021/3,
  title={Space-Time Crop \& Attend: Improving Cross-modal Video Representation Learning},
  author={Patrick, M. and Asano, Y. M. and Huang, B. and Misra, I. and Metze, F. and others},
  year={2021}
}

Preface

Bertinetto L, Henriques JF, Albanie S, Paganini M & Varol G (2021), Proceedings of Machine Learning Research, 148, I

BibTeX
@article{preface-2021/1,
  title={Preface},
  author={Bertinetto, L. and Henriques, J. F. and Albanie, S. and Paganini, M. and Varol, G.},
  journal={Proceedings of Machine Learning Research},
  volume={148},
  pages={I},
  year={2021}
}

Quantised Transforming Auto-Encoders: Achieving Equivariance to Arbitrary Transformations in Deep Networks

Jiao J & Henriques JF (2021), 32nd British Machine Vision Conference, BMVC 2021

BibTeX
@inproceedings{quantisedtransf-2021/1,
  title={Quantised Transforming Auto-Encoders: Achieving Equivariance to Arbitrary Transformations in Deep Networks},
  author={Jiao, J. and Henriques, J. F.},
  booktitle={32nd British Machine Vision Conference ({BMVC} 2021)},
  year={2021}
}

Gradient Shape Model

Martins P, Henriques JF & Batista J (2020), International Journal of Computer Vision, 128(12), 2828-2848

BibTeX View PDF
@article{gradientshapemo-2020/12,
  title={Gradient Shape Model},
  author={Martins, P. and Henriques, J. F. and Batista, J.},
  journal={International Journal of Computer Vision},
  volume={128},
  number={12},
  pages={2828--2848},
  publisher={Springer Nature},
  year={2020}
}

Support-set bottlenecks for video-text representation learning

Patrick M, Huang P-Y, Asano Y, Metze F, Hauptmann A et al. (2020)

BibTeX View PDF
@misc{supportsetbottl-2020/10,
  title={Support-set bottlenecks for video-text representation learning},
  author={Patrick, M. and Huang, P.-Y. and Asano, Y. and Metze, F. and Hauptmann, A. and others},
  year={2020}
}

Automatic Recall Machines: Internal Replay, Continual Learning and the Brain

Ji X, Henriques J, Tuytelaars T & Vedaldi A (2020)

BibTeX View PDF
@misc{automaticrecall-2020/6,
  title={Automatic Recall Machines: Internal Replay, Continual Learning and the Brain},
  author={Ji, X. and Henriques, J. and Tuytelaars, T. and Vedaldi, A.},
  year={2020}
}

On Compositions of Transformations in Contrastive Self-Supervised Learning

Patrick M, Asano YM, Kuznetsova P, Fong R, Henriques JF et al. (2020)

BibTeX View PDF
@misc{oncompositionso-2020/3,
  title={On Compositions of Transformations in Contrastive Self-Supervised Learning},
  author={Patrick, M. and Asano, Y. M. and Kuznetsova, P. and Fong, R. and Henriques, J. F. and others},
  year={2020}
}

Small steps and giant leaps: minimal newton solvers for deep learning

Henriques J, Ehrhardt S, Albanie S & Vedaldi A (2020), Proceedings of the International Conference on Computer Vision 2019

BibTeX View PDF
@inproceedings{smallstepsandgi-2020/2,
  title={Small steps and giant leaps: minimal {Newton} solvers for deep learning},
  author={Henriques, J. and Ehrhardt, S. and Albanie, S. and Vedaldi, A.},
  booktitle={2019 {IEEE/CVF} International Conference on Computer Vision ({ICCV})},
  year={2020}
}

Invariant information clustering for unsupervised image classification and segmentation

Ji X, Henriques JF & Vedaldi A (2020), 2019 IEEE/CVF International Conference on Computer Vision (ICCV), 9864-9873

BibTeX View PDF
@inproceedings{invariantinform-2020/2,
  title={Invariant information clustering for unsupervised image classification and segmentation},
  author={Ji, X. and Henriques, J. F. and Vedaldi, A.},
  booktitle={International Conference on Computer Vision ({ICCV})},
  pages={9864--9873},
  year={2020}
}

360 Camera Alignment via Segmentation

Davidson B, Alvi MS & Henriques JF (2020), 12373, 579-595

BibTeX View PDF
@inproceedings{cameraalignment-2020/,
  title={360 Camera Alignment via Segmentation},
  author={Davidson, B. and Alvi, M. S. and Henriques, J. F.},
  volume={12373},
  pages={579--595},
  year={2020}
}

Meta-learning with differentiable closed-form solvers

Bertinetto L, Henriques J, Torr P & Vedaldi A (2019), Proceedings of the International Conference on Learning Representations (ICLR 2019)

BibTeX
@inproceedings{metalearningwit-2019/2,
  title={Meta-learning with differentiable closed-form solvers},
  author={Bertinetto, L. and Henriques, J. and Torr, P. and Vedaldi, A.},
  booktitle={7th International Conference on Learning Representations ({ICLR} 2019)},
  year={2019}
}

The sixth visual object tracking VOT2018 challenge results

Kristan M, Leonardis A, Matas J, Vedaldi A, Henriques J et al. (2019), ECCV 2018: Computer Vision – ECCV 2018 Workshops, 11129, 3-53

BibTeX View PDF
@inproceedings{thesixthvisualo-2019/1,
  title={The sixth visual object tracking {VOT2018} challenge results},
  author={Kristan, M. and Leonardis, A. and Matas, J. and Vedaldi, A. and Henriques, J. and others},
  booktitle={Computer Vision -- {ECCV} 2018 Workshops},
  volume={11129},
  pages={3--53},
  year={2019}
}

Meta-learning with differentiable closed-form solvers

Henriques J, Torr P, Warren C & Vedaldi P (2019), 7th International Conference on Learning Representations, ICLR 2019

BibTeX
@inproceedings{metalearningwit-2019/1,
  title={Meta-learning with differentiable closed-form solvers},
  author={Henriques, J. and Torr, P. and Warren, C. and Vedaldi, P.},
  booktitle={7th International Conference on Learning Representations ({ICLR} 2019)},
  year={2019}
}

MapNet: An allocentric spatial memory for mapping environments

Henriques JF & Vedaldi A (2018), Conference on Computer Vision and Pattern Recognition (CVPR 2018)

BibTeX View PDF
@inproceedings{mapnetanallocen-2018/12,
  title={{MapNet}: An allocentric spatial memory for mapping environments},
  author={Henriques, J. F. and Vedaldi, A.},
  booktitle={Conference on Computer Vision and Pattern Recognition ({CVPR} 2018)},
  year={2018}
}

Long-term tracking in the wild: a benchmark

Valmadre J, Bertinetto L, Henriques JF, Tao R, Vedaldi A et al. (2018), ECCV 2018: Computer Vision – ECCV 2018, 11207, 692-707

BibTeX View PDF
@inproceedings{longtermtrackin-2018/10,
  title={Long-term tracking in the wild: a benchmark},
  author={Valmadre, J. and Bertinetto, L. and Henriques, J. F. and Tao, R. and Vedaldi, A. and others},
  booktitle={Computer Vision -- {ECCV} 2018},
  volume={11207},
  pages={692--707},
  year={2018}
}

Invariant Information Clustering for Unsupervised Image Classification and Segmentation

Ji X, Henriques JF & Vedaldi A (2018)

BibTeX View PDF
@misc{invariantinform-2018/7,
  title={Invariant Information Clustering for Unsupervised Image Classification and Segmentation},
  author={Ji, X. and Henriques, J. F. and Vedaldi, A.},
  year={2018}
}

Small steps and giant leaps: Minimal Newton solvers for Deep Learning

Henriques JF, Ehrhardt S, Albanie S & Vedaldi A (2018)

BibTeX View PDF
@misc{smallstepsandgi-2018/5,
  title={Small steps and giant leaps: Minimal {Newton} solvers for Deep Learning},
  author={Henriques, J. F. and Ehrhardt, S. and Albanie, S. and Vedaldi, A.},
  year={2018}
}

Meta-learning with differentiable closed-form solvers

Bertinetto L, Henriques JF, Torr PHS & Vedaldi A (2018)

BibTeX View PDF
@misc{metalearningwit-2018/5,
  title={Meta-learning with differentiable closed-form solvers},
  author={Bertinetto, L. and Henriques, J. F. and Torr, P. H. S. and Vedaldi, A.},
  year={2018}
}

Long-term Tracking in the Wild: A Benchmark

Valmadre J, Bertinetto L, Henriques JF, Tao R, Vedaldi A et al. (2018)

BibTeX View PDF
@misc{longtermtrackin-2018/3,
  title={Long-term Tracking in the Wild: A Benchmark},
  author={Valmadre, J. and Bertinetto, L. and Henriques, J. F. and Tao, R. and Vedaldi, A. and others},
  year={2018}
}

The visual object tracking VOT2017 challenge results

Kristan M, Leonardis A, Matas J, Felsberg M, Pflugfelder R et al. (2018), IEEE International Conference on Computer Vision Workshops

BibTeX View PDF
@inproceedings{thevisualobject-2018/1,
  title={The visual object tracking {VOT2017} challenge results},
  author={Kristan, M. and Leonardis, A. and Matas, J. and Felsberg, M. and Pflugfelder, R. and others},
  booktitle={{IEEE} International Conference on Computer Vision Workshops},
  year={2018}
}

End-to-end representation learning for Correlation Filter based tracking

Valmadre JL, Bertinetto L, Henriques JFDS, Vedaldi A & Torr PH (2017), IEEE International Conference on Computer Vision and Pattern Recognition (CVPR 2017)

BibTeX View PDF
@inproceedings{endtoendreprese-2017/11,
  title={End-to-end representation learning for Correlation Filter based tracking},
  author={Valmadre, J. L. and Bertinetto, L. and Henriques, J. F. D. S. and Vedaldi, A. and Torr, P. H.},
  booktitle={{IEEE} International Conference on Computer Vision and Pattern Recognition ({CVPR} 2017)},
  year={2017}
}

Warped convolutions: Efficient invariance to spatial transformations

Henriques JF & Vedaldi A (2017), Proceedings of the 34th International Conference on Machine Learning, 70, 1461-1469

BibTeX
@inproceedings{warpedconvoluti-2017/7,
  title={Warped convolutions: Efficient invariance to spatial transformations},
  author={Henriques, J. F. and Vedaldi, A.},
  booktitle={Proceedings of the 34th International Conference on Machine Learning ({ICML} 2017)},
  volume={70},
  pages={1461--1469},
  year={2017}
}