Skip to main content
Menu

Publications

Showing 50 publications by Iro Laina

Rethinking Image Super-Resolution from Training Data Perspectives

Ohtani G, Tadokoro R, Yamada R, Asano YM, Laina I et al. (2025), 15075, 19-36

BibTeX View PDF
@misc{rethinkingimage-2025/,
  title  = {Rethinking Image Super-Resolution from Training Data Perspectives},
  author = {Ohtani, G. and Tadokoro, R. and Yamada, R. and Asano, Y. M. and Laina, I. and others},
  year   = {2025}
}

Scaling Backwards: Minimal Synthetic Pre-Training?

Nakamura R, Tadokoro R, Yamada R, Asano YM, Laina I et al. (2025), 15073, 153-171

BibTeX View PDF
@misc{scalingbackward-2025/,
  title  = {Scaling Backwards: Minimal Synthetic Pre-Training?},
  author = {Nakamura, R. and Tadokoro, R. and Yamada, R. and Asano, Y. M. and Laina, I. and others},
  year   = {2025}
}

N2F2: hierarchical scene understanding with nested neural feature fields

Bhalgat Y, Laina I, Henriques J, Zisserman A & Vedaldi A (2024), Computer Vision – ECCV 2024 18th European Conference, Milan, Italy, September 29–October 4, 2024, Proceedings, Part LIX, 197-214

BibTeX View PDF
@inproceedings{nfhierarchicals-2024/11,
  title     = {{N2F2}: hierarchical scene understanding with nested neural feature fields},
  author    = {Bhalgat, Y. and Laina, I. and Henriques, J. and Zisserman, A. and Vedaldi, A.},
  booktitle = {18th European Conference on Computer Vision (ECCV 2024)},
  pages     = {197--214},
  year      = {2024}
}

Contrastive lift: 3D object instance segmentation by slow-fast contrastive fusion

Bhalgat Y, Laina I, Henriques J, Zisserman A & Vedaldi A (2024), Advances in Neural Information Processing Systems 36, 9092

BibTeX
@inproceedings{contrastivelift-2024/10,
  title     = {Contrastive lift: {3D} object instance segmentation by slow-fast contrastive fusion},
  author    = {Bhalgat, Y. and Laina, I. and Henriques, J. and Zisserman, A. and Vedaldi, A.},
  booktitle = {37th Conference on Neural Information Processing Systems (NeurIPS 2023)},
  pages     = {9092},
  year      = {2024}
}

Diffusion models for open-vocabulary segmentation

Karazija L, Laina I, Vedaldi A & Rupprecht C (2024), Computer Vision – ECCV 2024: 18th European Conference, Milan, Italy, September 29–October 4, 2024, Proceedings, Part V, 299-317

BibTeX View PDF
@inproceedings{diffusionmodels-2024/10,
  title     = {Diffusion models for open-vocabulary segmentation},
  author    = {Karazija, L. and Laina, I. and Vedaldi, A. and Rupprecht, C.},
  booktitle = {18th European Conference on Computer Vision (ECCV 2024)},
  pages     = {299--317},
  year      = {2024}
}

Splatt3R: Zero-shot Gaussian Splatting from Uncalibrated Image Pairs

Smart B, Zheng C, Laina I & Prisacariu VA (2024)

BibTeX View PDF
@misc{splattrzeroshot-2024/8,
  title  = {{Splatt3R}: Zero-shot {Gaussian} Splatting from Uncalibrated Image Pairs},
  author = {Smart, B. and Zheng, C. and Laina, I. and Prisacariu, V. A.},
  year   = {2024}
}

3D-aware instance segmentation and tracking in egocentric videos

Bhalgat Y, Tschernezki V, Laina I, Henriques J, Vedaldi A et al. (2024)

BibTeX View PDF
@misc{dawareinstances-2024/8,
  title  = {{3D}-aware instance segmentation and tracking in egocentric videos},
  author = {Bhalgat, Y. and Tschernezki, V. and Laina, I. and Henriques, J. and Vedaldi, A. and others},
  year   = {2024}
}

SHAP-EDITOR: instruction-guided latent 3D editing in seconds

Chen M, Xie J, Laina I & Vedaldi A (2024), 2024 IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR), 26446-26456

BibTeX View PDF
@inproceedings{shapeditorinstr-2024/5,
  title     = {{SHAP-EDITOR}: instruction-guided latent {3D} editing in seconds},
  author    = {Chen, M. and Xie, J. and Laina, I. and Vedaldi, A.},
  booktitle = {Conference on Computer Vision and Pattern Recognition (CVPR 2024)},
  pages     = {26446--26456},
  year      = {2024}
}

When LLMs step into the 3D World: A Survey and Meta-Analysis of 3D Tasks via Multi-modal Large Language Models

Ma X, Bhalgat Y, Smart B, Chen S, Li X et al. (2024)

BibTeX View PDF
@misc{whenllmsstepint-2024/5,
  title  = {When {LLMs} step into the {3D} World: A Survey and Meta-Analysis of {3D} Tasks via Multi-modal Large Language Models},
  author = {Ma, X. and Bhalgat, Y. and Smart, B. and Chen, S. and Li, X. and others},
  year   = {2024}
}

Training-free layout control with cross-attention guidance

Chen M, Laina I & Vedaldi A (2024), 2024 IEEE/CVF Winter Conference on Applications of Computer Vision (WACV), 5331-5341

BibTeX View PDF
@inproceedings{trainingfreelay-2024/4,
  title     = {Training-free layout control with cross-attention guidance},
  author    = {Chen, M. and Laina, I. and Vedaldi, A.},
  booktitle = {IEEE/CVF Winter Conference on Applications of Computer Vision (WACV 2024)},
  pages     = {5331--5341},
  year      = {2024}
}

Invisible stitch: generating smooth 3D scenes with depth inpainting

Engstler P, Vedaldi A, Laina I & Rupprecht C (2024)

BibTeX View PDF
@misc{invisiblestitch-2024/4,
  title  = {Invisible stitch: generating smooth {3D} scenes with depth inpainting},
  author = {Engstler, P. and Vedaldi, A. and Laina, I. and Rupprecht, C.},
  year   = {2024}
}

DGE: Direct Gaussian 3D editing by consistent multi-view editing

Chen M, Laina I & Vedaldi A (2024)

BibTeX View PDF
@misc{dgedirectgaussi-2024/4,
  title  = {{DGE}: Direct {Gaussian} {3D} editing by consistent multi-view editing},
  author = {Chen, M. and Laina, I. and Vedaldi, A.},
  year   = {2024}
}

N2F2: Hierarchical Scene Understanding with Nested Neural Feature Fields

Bhalgat Y, Laina I, Henriques JF, Zisserman A & Vedaldi A (2024)

BibTeX View PDF
@misc{nfhierarchicals-2024/3,
  title  = {{N2F2}: Hierarchical Scene Understanding with Nested Neural Feature Fields},
  author = {Bhalgat, Y. and Laina, I. and Henriques, J. F. and Zisserman, A. and Vedaldi, A.},
  year   = {2024}
}

IM-3D: iterative multiview diffusion and reconstruction for high-quality 3D generation

Melas-Kyriazi L, Laina I, Rupprecht C, Neverova N, Vedaldi A et al. (2024)

BibTeX View PDF
@misc{imditerativemul-2024/2,
  title  = {{IM-3D}: iterative multiview diffusion and reconstruction for high-quality {3D} generation},
  author = {Melas-Kyriazi, L. and Laina, I. and Rupprecht, C. and Neverova, N. and Vedaldi, A. and others},
  year   = {2024}
}

EPIC Fields: marrying 3D geometry and video understanding

Tschernezki V, Darkhalil A, Zhu Z, Fouhey D, Laina I et al. (2024), Proceedings of Advances in Neural Information Processing Systems (NeurIPS): Track on Datasets and Benchmarks, 2023, 36, 26485-26500

BibTeX
@inproceedings{epicfieldsmarry-2024/1,
  title     = {{EPIC} {Fields}: marrying {3D} geometry and video understanding},
  author    = {Tschernezki, V. and Darkhalil, A. and Zhu, Z. and Fouhey, D. and Laina, I. and others},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS 2023)},
  pages     = {26485--26500},
  year      = {2024}
}

SHAP-EDITOR: Instruction-guided Latent 3D Editing in Seconds

Chen M, Xie J, Laina I & Vedaldi A (2023)

BibTeX View PDF
@misc{shapeditorinstr-2023/12,
  title  = {{SHAP-EDITOR}: Instruction-guided Latent {3D} Editing in Seconds},
  author = {Chen, M. and Xie, J. and Laina, I. and Vedaldi, A.},
  year   = {2023}
}

RealFusion: 360 reconstruction of any object from a single image

Melas-Kyriazi L, Laina I, Rupprecht C & Vedaldi A (2023), 2023 IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR), 8446-8455

BibTeX View PDF
@inproceedings{realfusionrecon-2023/8,
  title     = {{RealFusion}: 360 reconstruction of any object from a single image},
  author    = {Melas-Kyriazi, L. and Laina, I. and Rupprecht, C. and Vedaldi, A.},
  booktitle = {Conference on Computer Vision and Pattern Recognition (CVPR 2023)},
  pages     = {8446--8455},
  year      = {2023}
}

Diffusion models for open-vocabulary segmentation

Karazija L, Vedaldi A, Laina I & Rupprecht C (2023)

BibTeX View PDF
@misc{diffusionmodels-2023/6,
  title  = {Diffusion models for open-vocabulary segmentation},
  author = {Karazija, L. and Vedaldi, A. and Laina, I. and Rupprecht, C.},
  year   = {2023}
}

Contrastive Lift: 3D Object Instance Segmentation by Slow-Fast Contrastive Fusion

Bhalgat Y, Laina I, Henriques JF, Zisserman A & Vedaldi A (2023)

BibTeX View PDF
@misc{contrastivelift-2023/6,
  title  = {Contrastive Lift: {3D} Object Instance Segmentation by Slow-Fast Contrastive Fusion},
  author = {Bhalgat, Y. and Laina, I. and Henriques, J. F. and Zisserman, A. and Vedaldi, A.},
  year   = {2023}
}

EPIC Fields: marrying 3D geometry and video understanding

Tschernezki V, Darkhalil A, Zhu Z, Fouhey D, Laina I et al. (2023)

BibTeX View PDF
@misc{epicfieldsmarry-2023/6,
  title  = {{EPIC} {Fields}: marrying {3D} geometry and video understanding},
  author = {Tschernezki, V. and Darkhalil, A. and Zhu, Z. and Fouhey, D. and Laina, I. and others},
  year   = {2023}
}

Training-free layout control with cross-attention guidance

Chen M, Laina I & Vedaldi A (2023)

BibTeX View PDF
@misc{trainingfreelay-2023/4,
  title  = {Training-free layout control with cross-attention guidance},
  author = {Chen, M. and Laina, I. and Vedaldi, A.},
  year   = {2023}
}

Neural feature fusion fields: 3D distillation of self-supervised 2D image representations

Tschernezki V, Laina I, Larlus D & Vedaldi A (2023), 2022 International Conference on 3D Vision (3DV), 443-453

BibTeX View PDF
@inproceedings{neuralfeaturefu-2023/2,
  title     = {Neural feature fusion fields: {3D} distillation of self-supervised {2D} image representations},
  author    = {Tschernezki, V. and Laina, I. and Larlus, D. and Vedaldi, A.},
  booktitle = {10th International Conference on 3D Vision (3DV 2022)},
  pages     = {443--453},
  year      = {2023}
}

RealFusion: 360° reconstruction of any object from a single image

Melas-Kyriazi L, Rupprecht C, Laina I & Vedaldi A (2023)

BibTeX View PDF
@misc{realfusionrecon-2023/2,
  title  = {{RealFusion}: 360{\textdegree} reconstruction of any object from a single image},
  author = {Melas-Kyriazi, L. and Rupprecht, C. and Laina, I. and Vedaldi, A.},
  year   = {2023}
}

Guess what moves: unsupervised video and image segmentation by anticipating motion

Choudhury S, Karazija L, Laina I, Vedaldi A & Rupprecht C (2022), 33rd British Machine Vision Conference Proceedings

BibTeX
@inproceedings{guesswhatmovesu-2022/11,
  title     = {Guess what moves: unsupervised video and image segmentation by anticipating motion},
  author    = {Choudhury, S. and Karazija, L. and Laina, I. and Vedaldi, A. and Rupprecht, C.},
  booktitle = {33rd British Machine Vision Conference (BMVC 2022)},
  year      = {2022}
}

Unsupervised multi-object segmentation by predicting probable motion patterns

Karazija L, Choudhury S, Laina I, Rupprecht C & Vedaldi A (2022)

BibTeX View PDF
@misc{unsupervisedmul-2022/10,
  title  = {Unsupervised multi-object segmentation by predicting probable motion patterns},
  author = {Karazija, L. and Choudhury, S. and Laina, I. and Rupprecht, C. and Vedaldi, A.},
  year   = {2022}
}

Deep spectral methods: a surprisingly strong baseline for unsupervised semantic segmentation and localization

Melas-Kyriazi L, Rupprecht C, Laina I & Vedaldi A (2022), 2022 IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR), 8354-8365

BibTeX View PDF
@inproceedings{deepspectralmet-2022/9,
  title     = {Deep spectral methods: a surprisingly strong baseline for unsupervised semantic segmentation and localization},
  author    = {Melas-Kyriazi, L. and Rupprecht, C. and Laina, I. and Vedaldi, A.},
  booktitle = {IEEE/CVF Computer Vision and Pattern Recognition Conference (CVPR 2022)},
  pages     = {8354--8365},
  year      = {2022}
}

Neural feature fusion fields: 3D distillation of self-supervised 2D image representations

Tschernezki V, Laina I, Larlus D & Vedaldi A (2022)

BibTeX View PDF
@misc{neuralfeaturefu-2022/9,
  title  = {Neural feature fusion fields: {3D} distillation of self-supervised {2D} image representations},
  author = {Tschernezki, V. and Laina, I. and Larlus, D. and Vedaldi, A.},
  year   = {2022}
}

Measuring the interpretability of unsupervised representations via quantized reverse probing

Laina I, Asano YM & Vedaldi A (2022)

BibTeX View PDF
@misc{measuringtheint-2022/9,
  title  = {Measuring the interpretability of unsupervised representations via quantized reverse probing},
  author = {Laina, I. and Asano, Y. M. and Vedaldi, A.},
  year   = {2022}
}

Guess what moves: unsupervised video and image segmentation by anticipating motion

Choudhury S, Karazija L, Laina I, Vedaldi A & Rupprecht C (2022)

BibTeX View PDF
@misc{guesswhatmovesu-2022/5,
  title  = {Guess what moves: unsupervised video and image segmentation by anticipating motion},
  author = {Choudhury, S. and Karazija, L. and Laina, I. and Vedaldi, A. and Rupprecht, C.},
  year   = {2022}
}

Deep spectral methods: a surprisingly strong baseline for unsupervised semantic segmentation and localization

Melas-Kyriazi L, Rupprecht C, Laina I & Vedaldi A (2022)

BibTeX View PDF
@misc{deepspectralmet-2022/5,
  title  = {Deep spectral methods: a surprisingly strong baseline for unsupervised semantic segmentation and localization},
  author = {Melas-Kyriazi, L. and Rupprecht, C. and Laina, I. and Vedaldi, A.},
  year   = {2022}
}

The curious layperson: fine-grained image recognition without expert labels

Choudhury S, Laina I, Rupprecht C & Vedaldi A (2022), Proceedings of the 32nd British Machine Vision Conference (BMVC 2021)

BibTeX
@inproceedings{thecuriouslaype-2022/3,
  title     = {The curious layperson: fine-grained image recognition without expert labels},
  author    = {Choudhury, S. and Laina, I. and Rupprecht, C. and Vedaldi, A.},
  booktitle = {32nd British Machine Vision Conference (BMVC 2021)},
  year      = {2022}
}

Unsupervised multi-object segmentation by predicting probable motion patterns

Karazija L, Choudhury S, Laina I, Rupprecht C & Vedaldi A (2022), Advances in Neural Information Processing Systems 35 (NeurIPS 2022), 35

BibTeX
@inproceedings{unsupervisedmul-2022/1,
  title     = {Unsupervised multi-object segmentation by predicting probable motion patterns},
  author    = {Karazija, L. and Choudhury, S. and Laina, I. and Rupprecht, C. and Vedaldi, A.},
  booktitle = {36th Neural Information Processing Systems (NeurIPS 2022)},
  year      = {2022}
}

Unsupervised part discovery from contrastive reconstruction

Choudhury S, Laina I, Rupprecht C & Vedaldi A (2021), Proceedings of the 34th Conference on Neural Information Processing Systems (NeuRIPS 2021)

BibTeX
@inproceedings{unsupervisedpar-2021/12,
  title     = {Unsupervised part discovery from contrastive reconstruction},
  author    = {Choudhury, S. and Laina, I. and Rupprecht, C. and Vedaldi, A.},
  booktitle = {34th Conference on Neural Information Processing Systems (NeurIPS 2021)},
  year      = {2021}
}

The curious layperson: fine-grained image recognition without expert labels

Choudhury S, Laina I, Rupprecht C & Vedaldi A (2021)

BibTeX View PDF
@misc{thecuriouslaype-2021/11,
  title  = {The curious layperson: fine-grained image recognition without expert labels},
  author = {Choudhury, S. and Laina, I. and Rupprecht, C. and Vedaldi, A.},
  year   = {2021}
}

Unsupervised part discovery from contrastive reconstruction

Choudhury S, Laina I, Rupprecht C & Vedaldi A (2021)

BibTeX View PDF
@misc{unsupervisedpar-2021/11,
  title  = {Unsupervised part discovery from contrastive reconstruction},
  author = {Choudhury, S. and Laina, I. and Rupprecht, C. and Vedaldi, A.},
  year   = {2021}
}

Measuring the interpretability of unsupervised representations via quantized reversed probing

Laina I, Asano Y & Vedaldi A (2021), International Conference on Learning Representations

BibTeX
@inproceedings{measuringtheint-2021/9,
  title     = {Measuring the interpretability of unsupervised representations via quantized reversed probing},
  author    = {Laina, I. and Asano, Y. and Vedaldi, A.},
  booktitle = {Tenth International Conference on Learning Representations (ICLR 2022)},
  year      = {2021}
}

Finding an unsupervised image segmenter in each of your deep generative models

Melas-Kyriazi L, Rupprecht C, Laina I & Vedaldi A (2021), International Conference on Learning Representations

BibTeX
@inproceedings{findinganunsupe-2021/9,
  title     = {Finding an unsupervised image segmenter in each of your deep generative models},
  author    = {Melas-Kyriazi, L. and Rupprecht, C. and Laina, I. and Vedaldi, A.},
  booktitle = {Tenth International Conference on Learning Representations (ICLR 2022)},
  year      = {2021}
}

Quantifying learnability and describability of visual concepts emerging in representation learning

Laina I, Fong RC & Vedaldi A (2021), Advances in Neural Information Processing Systems 33, 16, 13112-13126

BibTeX
@inproceedings{quantifyinglear-2021/7,
  title     = {Quantifying learnability and describability of visual concepts emerging in representation learning},
  author    = {Laina, I. and Fong, R. C. and Vedaldi, A.},
  booktitle = {34th Annual Conference on Neural Information Processing Systems (NeurIPS 2020)},
  pages     = {13112--13126},
  year      = {2021}
}

Finding an unsupervised image segmenter in each of your deep generative models

Melas-Kyriazi L, Rupprecht C, Laina I & Vedaldi A (2021)

BibTeX View PDF
@misc{findinganunsupe-2021/5,
  title  = {Finding an unsupervised image segmenter in each of your deep generative models},
  author = {Melas-Kyriazi, L. and Rupprecht, C. and Laina, I. and Vedaldi, A.},
  year   = {2021}
}

The Curious Layperson: Fine-Grained Image Recognition without Expert Labels

Choudhury S, Laina I, Rupprecht C & Vedaldi A (2021), 32nd British Machine Vision Conference, BMVC 2021

BibTeX
@inproceedings{thecuriouslaype-2021/1,
  title     = {The Curious Layperson: Fine-Grained Image Recognition without Expert Labels},
  author    = {Choudhury, S. and Laina, I. and Rupprecht, C. and Vedaldi, A.},
  booktitle = {32nd British Machine Vision Conference (BMVC 2021)},
  year      = {2021}
}

Quantifying learnability and describability of visual concepts emerging in representation learning

Laina I, Fong RC & Vedaldi A (2020)

BibTeX View PDF
@misc{quantifyinglear-2020/10,
  title  = {Quantifying learnability and describability of visual concepts emerging in representation learning},
  author = {Laina, I. and Fong, R. C. and Vedaldi, A.},
  year   = {2020}
}

Semantic Image Manipulation Using Scene Graphs

Dhamo H, Farshad A, Laina I, Navab N, Hager GD et al. (2020), 00, 5212-5221

BibTeX View PDF
@inproceedings{semanticimagema-2020/6,
  title     = {Semantic Image Manipulation Using Scene Graphs},
  author    = {Dhamo, H. and Farshad, A. and Laina, I. and Navab, N. and Hager, G. D. and others},
  booktitle = {2020 IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)},
  pages     = {5212--5221},
  year      = {2020}
}

Towards Unsupervised Image Captioning with Shared Multimodal Embeddings

Laina I, Rupprecht C & Navab N (2019), 00, 7413-7423

BibTeX View PDF
@inproceedings{towardsunsuperv-2019/11,
  title     = {Towards Unsupervised Image Captioning with Shared Multimodal Embeddings},
  author    = {Laina, I. and Rupprecht, C. and Navab, N.},
  booktitle = {2019 IEEE/CVF International Conference on Computer Vision (ICCV)},
  pages     = {7413--7423},
  year      = {2019}
}

Dealing with Ambiguity in Robotic Grasping via Multiple Predictions

Ghazaei G, Laina I, Rupprecht C, Tombari F, Navab N et al. (2019), Lecture Notes in Computer Science, 11364, 38-55

BibTeX View PDF
@inproceedings{dealingwithambi-2019/,
  title  = {Dealing with Ambiguity in Robotic Grasping via Multiple Predictions},
  author = {Ghazaei, G. and Laina, I. and Rupprecht, C. and Tombari, F. and Navab, N. and others},
  series = {Lecture Notes in Computer Science},
  volume = {11364},
  pages  = {38--55},
  year   = {2019}
}

Guide Me: Interacting with Deep Networks

Rupprecht C, Laina I, Navab N, Hager GD & Tombari F (2018), 8551-8561

BibTeX View PDF
@inproceedings{guidemeinteract-2018/6,
  title     = {Guide Me: Interacting with Deep Networks},
  author    = {Rupprecht, C. and Laina, I. and Navab, N. and Hager, G. D. and Tombari, F.},
  booktitle = {2018 IEEE/CVF Conference on Computer Vision and Pattern Recognition},
  pages     = {8551--8561},
  year      = {2018}
}

Learning in an Uncertain World: Representing Ambiguity Through Multiple Hypotheses

Rupprecht C, Laina I, DiPietro R, Baust M, Tombari F et al. (2017), 3611-3620

BibTeX View PDF
@inproceedings{learninginanunc-2017/10,
  title     = {Learning in an Uncertain World: Representing Ambiguity Through Multiple Hypotheses},
  author    = {Rupprecht, C. and Laina, I. and DiPietro, R. and Baust, M. and Tombari, F. and others},
  booktitle = {2017 IEEE International Conference on Computer Vision (ICCV)},
  pages     = {3611--3620},
  year      = {2017}
}

Concurrent Segmentation and Localization for Tracking of Surgical Instruments

Laina I, Rieke N, Rupprecht C, Vizcaíno JP, Eslami A et al. (2017), Lecture Notes in Computer Science, 10434, 664-672

BibTeX View PDF
@inproceedings{concurrentsegme-2017/,
  title  = {Concurrent Segmentation and Localization for Tracking of Surgical Instruments},
  author = {Laina, I. and Rieke, N. and Rupprecht, C. and Vizca{\'\i}no, J. P. and Eslami, A. and others},
  series = {Lecture Notes in Computer Science},
  volume = {10434},
  pages  = {664--672},
  year   = {2017}
}

Deeper Depth Prediction with Fully Convolutional Residual Networks

Laina I, Rupprecht C, Belagiannis V, Tombari F & Navab N (2016)

BibTeX View PDF
@misc{deeperdepthpred-2016/6,
  title  = {Deeper Depth Prediction with Fully Convolutional Residual Networks},
  author = {Laina, I. and Rupprecht, C. and Belagiannis, V. and Tombari, F. and Navab, N.},
  year   = {2016}
}

Deeper Depth Prediction with Fully Convolutional Residual Networks

Laina I, Rupprecht C, Belagiannis V, Tombari F & Navab N (0), 239-248

BibTeX View PDF
@inproceedings{deeperdepthpred-/,
  title     = {Deeper Depth Prediction with Fully Convolutional Residual Networks},
  author    = {Laina, I. and Rupprecht, C. and Belagiannis, V. and Tombari, F. and Navab, N.},
  booktitle = {2016 Fourth International Conference on 3D Vision (3DV)},
  pages     = {239--248},
  year      = {2016}
}

RealFusion: 360 Reconstruction of Any Object from a Single Image

Melas-Kyriazi L, Laina I, Rupprecht C & Vedaldi A (0)

BibTeX
@inproceedings{realfusionrecon-/,
  title     = {{RealFusion}: 360 Reconstruction of Any Object from a Single Image},
  author    = {Melas-Kyriazi, L. and Laina, I. and Rupprecht, C. and Vedaldi, A.},
  booktitle = {Conference on Computer Vision and Pattern Recognition (CVPR 2023)},
  year      = {2023}
}