Publications

2026

Scale Space Diffusion

Soumik Mukhopadhyay, Prateksha Udhayanan, Abhinav Shrivastava

CVPR 2026 new

BibTeX

@inproceedings{mukhopadhyay2026scale,
  author    = {Mukhopadhyay, Soumik and Udhayanan, Prateksha and Shrivastava, Abhinav},
  title     = {{Scale Space Diffusion}},
  booktitle = {CVPR},
  year      = {2026},
}

UPLiFT: Efficient Pixel-Dense Feature Upsampling with Local Attenders

Matthew Walmer, Saksham Suri, Anirud Aggarwal, Abhinav Shrivastava

CVPR 2026 new

pdf / webpage / code /

BibTeX

@inproceedings{walmer2026uplift,
  title={{UPLiFT: Efficient Pixel-Dense Feature Upsampling with Local Attenders}},
  author={Walmer, Matthew and Suri, Saksham and Aggarwal, Anirud and Shrivastava, Abhinav},
  booktitle={CVPR},
  year={2026},
  url={https://arxiv.org/abs/2601.17950},
}

Efficient and High-Fidelity Omni Modality Retrieval

Chuong Huynh, Manh Luong, Abhinav Shrivastava

CVPR 2026 new

BibTeX

@inproceedings{huynh2026efficient,
  author    = {Huynh, Chuong and Luong, Manh and Shrivastava, Abhinav},
  title     = {{Efficient and High-Fidelity Omni Modality Retrieval}},
  booktitle = {CVPR},
  year      = {2026},
}

Evolutionary Caching to Accelerate Your Off-the-Shelf Diffusion Model

Anirud Aggarwal, Abhinav Shrivastava, Matthew Gwilliam

ICLR 2026 new

pdf / webpage / code /

BibTeX

@inproceedings{aggarwal2026evolutionary,
  title={{Evolutionary Caching to Accelerate Your Off-the-Shelf Diffusion Model}},
  author={Aggarwal, Anirud and Shrivastava, Abhinav and Gwilliam, Matthew},
  booktitle={ICLR},
  year={2026},
  url={https://arxiv.org/abs/2506.15682},
}

NeRV-Diffusion: Diffuse Implicit Neural Representation for Video Synthesis

Yixuan Ren, Hanyu Wang, Hao Chen, Bo He, Abhinav Shrivastava

ICLR 2026 new

pdf / webpage /

BibTeX

@inproceedings{ren2026nervdiffusion,
  title={{NeRV-Diffusion: Diffuse Implicit Neural Representation for Video Synthesis}},
  author={Ren, Yixuan and Wang, Hanyu and Chen, Hao and He, Bo and Shrivastava, Abhinav},
  booktitle={ICLR},
  year={2026},
  url={https://arxiv.org/abs/2509.24353},
}

Towards Understanding Best Practices for Quantization of Vision-Language Models

Gautom Das, Vincent La, Ethan Lau, Abhinav Shrivastava, Matthew Gwilliam

arXiv 2026 new

pdf / code /

BibTeX

@article{das2026towards,
  title={{Towards Understanding Best Practices for Quantization of Vision-Language Models}},
  author={Das, Gautom and La, Vincent and Lau, Ethan and Shrivastava, Abhinav and Gwilliam, Matthew},
  journal={arXiv},
  year={2026},
  url={https://arxiv.org/abs/2601.15287},
}

VeriGraph: Scene Graphs for Execution Verifiable Robot Planning

Daniel Ekpo, Archana Swaminathan, Mara Levy, Saksham Suri, Chuong Huynh, Abhinav Shrivastava

ICRA 2026 new

pdf /

BibTeX

@inproceedings{ekpo2026verigraph,
  title={{VeriGraph: Scene Graphs for Execution Verifiable Robot Planning}},
  author={Ekpo, Daniel and Swaminathan, Archana and Levy, Mara and Suri, Saksham and Huynh, Chuong and Shrivastava, Abhinav},
  booktitle={ICRA},
  year={2026},
  url={https://arxiv.org/abs/2411.10446},
}

Growing Visual Generative Capacity for Pre-Trained MLLMs

Hanyu Wang, Jiaming Han, Ziyan Yang, Abhinav Shrivastava

MM Intelligence Workshop, ICLR 2026

pdf / webpage / code /

BibTeX

@inproceedings{wang2026growing,
  title={{Growing Visual Generative Capacity for Pre-Trained MLLMs}},
  author={Wang, Hanyu and Han, Jiaming and Yang, Ziyan and Shrivastava, Abhinav},
  booktitle={MM Intelligence Workshop, ICLR},
  year={2026},
  url={https://arxiv.org/abs/2510.01546},
}

How to Design and Train Your Implicit Neural Representation for Video Compression

Matthew Gwilliam, Roy Zhang, Namitha Padmanabhan, Hongyang Du, Abhinav Shrivastava

WACV 2026 new

pdf / webpage / code /

BibTeX

@inproceedings{gwilliam2026how,
  title={{How to Design and Train Your Implicit Neural Representation for Video Compression}},
  author={Gwilliam, Matthew and Zhang, Roy and Padmanabhan, Namitha and Du, Hongyang and Shrivastava, Abhinav},
  booktitle={WACV},
  year={2026},
  url={https://arxiv.org/abs/2506.24127},
}

2025

Characterizing Motion Encoding in Video Diffusion Timesteps

Vatsal Baherwani, Yixuan Ren, Abhinav Shrivastava

arXiv 2025

pdf /

BibTeX

@article{baherwani2025characterizing,
  title={{Characterizing Motion Encoding in Video Diffusion Timesteps}},
  author={Baherwani, Vatsal and Ren, Yixuan and Shrivastava, Abhinav},
  journal={arXiv},
  year={2025},
  url={https://arxiv.org/abs/2512.22175},
}

Imagine, Verify, Execute: Memory-guided Agentic Exploration with Vision-Language Models

Seungjae Lee, Daniel Ekpo, Haowen Liu, Furong Huang, Abhinav Shrivastava, Jia-Bin Huang

CoRL 2025

pdf / webpage /

BibTeX

@inproceedings{lee2025imagine,
  title={{Imagine, Verify, Execute: Memory-guided Agentic Exploration with Vision-Language Models}},
  author={Lee, Seungjae and Ekpo, Daniel and Liu, Haowen and Huang, Furong and Shrivastava, Abhinav and Huang, Jia-Bin},
  booktitle={CoRL},
  year={2025},
  url={https://arxiv.org/abs/2505.07815},
}

Towards Multimodal Understanding via Stable Diffusion as a Task-Aware Feature Extractor

Vatsal Agarwal, Matthew Gwilliam, Gefen Kohavi, Eshan Verma, Daniel Ulbricht, Abhinav Shrivastava

arXiv 2025

pdf / webpage /

BibTeX

@article{agarwal2025towards,
  title={{Towards Multimodal Understanding via Stable Diffusion as a Task-Aware Feature Extractor}},
  author={Agarwal, Vatsal and Gwilliam, Matthew and Kohavi, Gefen and Verma, Eshan and Ulbricht, Daniel and Shrivastava, Abhinav},
  journal={arXiv},
  year={2025},
  url={https://arxiv.org/abs/2507.07106},
}

Trokens: Semantic-Aware Relational Trajectory Tokens for Few-Shot Action Recognition

Pulkit Kumar, Shuaiyi Huang, Matthew Walmer, Sai Saketh Rambhatla, Abhinav Shrivastava

ICCV 2025

pdf / webpage / code /

BibTeX

@inproceedings{kumar2025trokens,
  title={{Trokens: Semantic-Aware Relational Trajectory Tokens for Few-Shot Action Recognition}},
  author={Kumar, Pulkit and Huang, Shuaiyi and Walmer, Matthew and Rambhatla, Sai Saketh and Shrivastava, Abhinav},
  booktitle={ICCV},
  year={2025},
  url={https://arxiv.org/abs/2508.03695},
}

MAPS: Memory Augmented Panoptic Segmentation

Vatsal Agarwal, Saksham Suri, Max Ehrlich, Abhinav Shrivastava

MemVis Workshop, ICCV 2025 oral

pdf /

BibTeX

@inproceedings{agarwal2025maps,
  author    = {Agarwal, Vatsal and Suri, Saksham and Ehrlich, Max and Shrivastava, Abhinav},
  title     = {{MAPS: Memory Augmented Panoptic Segmentation}},
  booktitle = {MemVis Workshop, ICCV},
  year      = {2025},
}

Multi-entity Video Transformers for Fine-Grained Video Representation Learning

Matthew Walmer, Rose Kanjirathinkal, Kai-Sheng Tai, Keyur Muzumdar, Taipeng Tian, Abhinav Shrivastava

FGVC Workshop, CVPR 2025

pdf / code /

BibTeX

@inproceedings{walmer2025multientity,
  title={{Multi-entity Video Transformers for Fine-Grained Video Representation Learning}},
  author={Walmer, Matthew and Kanjirathinkal, Rose and Tai, Kai-Sheng and Muzumdar, Keyur and Tian, Taipeng and Shrivastava, Abhinav},
  booktitle={FGVC Workshop, CVPR},
  year={2025},
  url={https://arxiv.org/abs/2311.10873},
}

CoLLM: A Large Language Model for Composed Image Retrieval

Chuong Huynh, Jinyu Yang, Ashish Tawari, Mubarak Shah, Son Tran, Raffay Hamid, Trishul Chilimbi, Abhinav Shrivastava

CVPR 2025

pdf / webpage / code /

BibTeX

@inproceedings{huynh2025collm,
  title={{CoLLM: A Large Language Model for Composed Image Retrieval}},
  author={Huynh, Chuong and Yang, Jinyu and Tawari, Ashish and Shah, Mubarak and Tran, Son and Hamid, Raffay and Chilimbi, Trishul and Shrivastava, Abhinav},
  booktitle={CVPR},
  year={2025},
  url={https://arxiv.org/abs/2503.19910},
}

LARP: Tokenizing Videos with a Learned Autoregressive Generative Prior

Hanyu Wang, Saksham Suri, Yixuan Ren, Hao Chen, Abhinav Shrivastava

ICLR 2025 oral

pdf / webpage / code /

BibTeX

@inproceedings{wang2025larp,
  title={{LARP: Tokenizing Videos with a Learned Autoregressive Generative Prior}},
  author={Wang, Hanyu and Suri, Saksham and Ren, Yixuan and Chen, Hao and Shrivastava, Abhinav},
  booktitle={ICLR},
  year={2025},
  url={https://arxiv.org/abs/2410.21264},
}

P3-PO: Prescriptive Point Priors for Visuo-Spatial Generalization of Robot Policies

Mara Levy, Siddhant Haldar, Lerrel Pinto, Abhinav Shrivastava

ICRA 2025

pdf / webpage / code /

BibTeX

@inproceedings{levy2025ppo,
  title={{P3-PO: Prescriptive Point Priors for Visuo-Spatial Generalization of Robot Policies}},
  author={Levy, Mara and Haldar, Siddhant and Pinto, Lerrel and Shrivastava, Abhinav},
  booktitle={ICRA},
  year={2025},
  url={https://arxiv.org/abs/2412.06784},
}

TREND: Tri-teaching for Robust Preference-based Reinforcement Learning with Demonstrations

Shuaiyi Huang, Mara Levy, Anubhav, Daniel Ekpo, Ruijie Zheng, Abhinav Shrivastava

ICRA 2025

pdf / webpage /

BibTeX

@inproceedings{huang2025trend,
  title={{TREND: Tri-teaching for Robust Preference-based Reinforcement Learning with Demonstrations}},
  author={Huang, Shuaiyi and Levy, Mara and Anubhav and Ekpo, Daniel and Zheng, Ruijie and Shrivastava, Abhinav},
  booktitle={ICRA},
  year={2025},
  url={https://arxiv.org/abs/2505.06079},
}

A Video is Worth 10,000 Words: Training and Benchmarking with Diverse Captions for Better Long Video Retrieval

Matthew Gwilliam, Michael Cogswell, Meng Ye, Karan Sikka, Abhinav Shrivastava, Ajay Divakaran

WACV 2025

pdf / webpage /

BibTeX

@inproceedings{gwilliam2025a,
  title={{A Video is Worth 10,000 Words: Training and Benchmarking with Diverse Captions for Better Long Video Retrieval}},
  author={Gwilliam, Matthew and Cogswell, Michael and Ye, Meng and Sikka, Karan and Shrivastava, Abhinav and Divakaran, Ajay},
  booktitle={WACV},
  year={2025},
  url={https://arxiv.org/abs/2312.00115},
}

Unified Framework for Open-World Compositional Zero-shot Learning

Hirunima Jayasekara, Khoi Pham, Nirat Saini, Abhinav Shrivastava

WACV 2025

pdf / code /

BibTeX

@inproceedings{jayasekara2025unified,
  title={{Unified Framework for Open-World Compositional Zero-shot Learning}},
  author={Jayasekara, Hirunima and Pham, Khoi and Saini, Nirat and Shrivastava, Abhinav},
  booktitle={WACV},
  year={2025},
  url={https://arxiv.org/abs/2412.04083},
}

2024

Efficient Continuous Video Flow Model for Video Prediction

Gaurav Shrivastava, Abhinav Shrivastava

arXiv 2024

pdf /

BibTeX

@article{shrivastava2024efficient,
  title={{Efficient Continuous Video Flow Model for Video Prediction}},
  author={Shrivastava, Gaurav and Shrivastava, Abhinav},
  journal={arXiv},
  year={2024},
  url={https://arxiv.org/abs/2412.05633},
}

AutoHallusion: Automatic Generation of Hallucination Benchmarks for Vision-Language Models

Xiyang Wu, Tianrui Guan, Dianqi Li, Shuaiyi Huang, Xiaoyu Liu, Xijun Wang, Ruiqi Xian, Abhinav Shrivastava, Furong Huang, Jordan Boyd-Graber, Tianyi Zhou, Dinesh Manocha

EMNLP Findings 2024

pdf / webpage / code /

BibTeX

@inproceedings{wu2024autohallusion,
  title={{AutoHallusion: Automatic Generation of Hallucination Benchmarks for Vision-Language Models}},
  author={Wu, Xiyang and Guan, Tianrui and Li, Dianqi and Huang, Shuaiyi and Liu, Xiaoyu and Wang, Xijun and Xian, Ruiqi and Shrivastava, Abhinav and Huang, Furong and Boyd-Graber, Jordan and Zhou, Tianyi and Manocha, Dinesh},
  booktitle={EMNLP Findings},
  year={2024},
  url={https://arxiv.org/abs/2406.10900},
}

QUEEN: QUantized Efficient ENcoding of Dynamic Gaussians for Streaming Free-viewpoint Videos

Sharath Girish, Tianye Li, Amrita Mazumdar, Abhinav Shrivastava, David Luebke, Shalini De Mello

NeurIPS 2024

pdf / webpage / code / video /

BibTeX

@inproceedings{girish2024queen,
  title={{QUEEN: QUantized Efficient ENcoding of Dynamic Gaussians for Streaming Free-viewpoint Videos}},
  author={Girish, Sharath and Li, Tianye and Mazumdar, Amrita and Shrivastava, Abhinav and Luebke, David and De Mello, Shalini},
  booktitle={NeurIPS},
  year={2024},
  url={https://arxiv.org/abs/2412.04469},
}

Coarse to Fine Human Mesh Recovery with Transformers

Vatsal Agarwal, Mara Levy, Max Ehrlich, Yucheng Tang, Nanxuan Zhang, Abhinav Shrivastava

T-CAP Workshop, ECCV 2024

pdf /

BibTeX

@inproceedings{agarwal2024coarse,
  title={{Coarse to Fine Human Mesh Recovery with Transformers}},
  author={Agarwal, Vatsal and Levy, Mara and Ehrlich, Max and Tang, Yucheng and Zhang, Nanxuan and Shrivastava, Abhinav},
  booktitle={T-CAP Workshop, ECCV},
  year={2024},
  url={https://link.springer.com/chapter/10.1007/978-3-031-91575-8_18},
}

Customize-A-Video: One-Shot Motion Customization of Text-to-Video Diffusion Models

Yixuan Ren, Yang Zhou, Jimei Yang, Jing Shi, Difan Liu, Feng Liu, Mingi Kwon, Abhinav Shrivastava

ECCV 2024

pdf / webpage /

BibTeX

@inproceedings{ren2024customizeavideo,
  title={{Customize-A-Video: One-Shot Motion Customization of Text-to-Video Diffusion Models}},
  author={Ren, Yixuan and Zhou, Yang and Yang, Jimei and Shi, Jing and Liu, Difan and Liu, Feng and Kwon, Mingi and Shrivastava, Abhinav},
  booktitle={ECCV},
  year={2024},
  url={https://arxiv.org/abs/2402.14780},
}

Do text-free diffusion models learn discriminative visual representations?

Soumik Mukhopadhyay, Matthew Gwilliam, Yosuke Yamaguchi, Vatsal Agarwal, Namitha Padmanabhan, Archana Swaminathan, Tianyi Zhou, Jun Ohya, Abhinav Shrivastava

ECCV 2024

pdf / webpage / code /

BibTeX

@inproceedings{mukhopadhyay2024do,
  title={{Do text-free diffusion models learn discriminative visual representations?}},
  author={Mukhopadhyay, Soumik and Gwilliam, Matthew and Yamaguchi, Yosuke and Agarwal, Vatsal and Padmanabhan, Namitha and Swaminathan, Archana and Zhou, Tianyi and Ohya, Jun and Shrivastava, Abhinav},
  booktitle={ECCV},
  year={2024},
  url={https://arxiv.org/abs/2311.17921},
}

EAGLES: Efficient Accelerated 3D Gaussians with Lightweight EncodingS

Sharath Girish, Kamal Gupta, Abhinav Shrivastava

ECCV 2024

pdf / webpage / code /

BibTeX

@inproceedings{girish2024eagles,
  title={{EAGLES: Efficient Accelerated 3D Gaussians with Lightweight EncodingS}},
  author={Girish, Sharath and Gupta, Kamal and Shrivastava, Abhinav},
  booktitle={ECCV},
  year={2024},
  url={https://arxiv.org/abs/2312.04564},
}

Fast Encoding and Decoding for Implicit Video Representation

Hao Chen, Saining Xie, Ser-Nam Lim, Abhinav Shrivastava

ECCV 2024

pdf / webpage / code /

BibTeX

@inproceedings{chen2024fast,
  title={{Fast Encoding and Decoding for Implicit Video Representation}},
  author={Chen, Hao and Xie, Saining and Lim, Ser-Nam and Shrivastava, Abhinav},
  booktitle={ECCV},
  year={2024},
  url={https://arxiv.org/abs/2409.19429},
}

Investigating Style Similarity in Diffusion Models

Gowthami Somepalli, Anubhav, Kamal Gupta, Shramay Palta, Micah Goldblum, Jonas Geiping, Abhinav Shrivastava, Tom Goldstein

ECCV 2024

pdf / webpage / code /

BibTeX

@inproceedings{somepalli2024investigating,
  title={{Investigating Style Similarity in Diffusion Models}},
  author={Somepalli, Gowthami and Anubhav and Gupta, Kamal and Palta, Shramay and Goldblum, Micah and Geiping, Jonas and Shrivastava, Abhinav and Goldstein, Tom},
  booktitle={ECCV},
  year={2024},
  url={https://arxiv.org/abs/2404.01292},
}

Latent-INR: A Flexible Framework for Implicit Representations of Videos with Discriminative Semantics

Shishira R Maiya, Anubhav, Matthew Gwilliam, Max Ehrlich, Abhinav Shrivastava

ECCV 2024

pdf / webpage /

BibTeX

@inproceedings{maiya2024latentinr,
  title={{Latent-INR: A Flexible Framework for Implicit Representations of Videos with Discriminative Semantics}},
  author={Maiya, Shishira R and Anubhav and Gwilliam, Matthew and Ehrlich, Max and Shrivastava, Abhinav},
  booktitle={ECCV},
  year={2024},
  url={https://arxiv.org/abs/2408.02672},
}

LEIA: Latent View-invariant Embeddings for Implicit 3D Articulation

Archana Swaminathan, Anubhav, Kamal Gupta, Shishira R Maiya, Vatsal Agarwal, Abhinav Shrivastava

ECCV 2024

pdf / webpage /

BibTeX

@inproceedings{swaminathan2024leia,
  title={{LEIA: Latent View-invariant Embeddings for Implicit 3D Articulation}},
  author={Swaminathan, Archana and Anubhav and Gupta, Kamal and Maiya, Shishira R and Agarwal, Vatsal and Shrivastava, Abhinav},
  booktitle={ECCV},
  year={2024},
  url={https://arxiv.org/abs/2409.06703},
}

LiFT: A Surprisingly Simple Lightweight Feature Transform for Dense ViT Descriptors

Saksham Suri, Matthew Walmer, Kamal Gupta, Abhinav Shrivastava

ECCV 2024

pdf / webpage / code /

BibTeX

@inproceedings{suri2024lift,
  title={{LiFT: A Surprisingly Simple Lightweight Feature Transform for Dense ViT Descriptors}},
  author={Suri, Saksham and Walmer, Matthew and Gupta, Kamal and Shrivastava, Abhinav},
  booktitle={ECCV},
  year={2024},
  url={https://arxiv.org/abs/2403.14625},
}

Quantifying NBA Shot Quality: A Deep Network Approach

Archit Kambhamettu, Abhinav Shrivastava, Matthew Gwilliam

ACM MMSports 2024

BibTeX

@inproceedings{kambhamettu2024quantifying,
  author    = {Kambhamettu, Archit and Shrivastava, Abhinav and Gwilliam, Matthew},
  title     = {{Quantifying NBA Shot Quality: A Deep Network Approach}},
  booktitle = {ACM MMSports},
  year      = {2024},
}

Trajectory-aligned Space-time Tokens for Few-shot Action Recognition

Pulkit Kumar, Namitha Padmanabhan, Luke Luo, Sai Saketh Rambhatla, Abhinav Shrivastava

ECCV 2024

pdf / webpage / code /

BibTeX

@inproceedings{kumar2024trajectoryaligned,
  title={{Trajectory-aligned Space-time Tokens for Few-shot Action Recognition}},
  author={Kumar, Pulkit and Padmanabhan, Namitha and Luo, Luke and Rambhatla, Sai Saketh and Shrivastava, Abhinav},
  booktitle={ECCV},
  year={2024},
  url={https://arxiv.org/abs/2407.18249},
}

ARDuP: Active Region Video Diffusion for Universal Policies

Shuaiyi Huang, Mara Levy, Zhenyu Jiang, Anima Anandkumar, Yuke Zhu, Linxi Fan, De-An Huang, Abhinav Shrivastava

IROS 2024

pdf /

BibTeX

@inproceedings{huang2024ardup,
  title={{ARDuP: Active Region Video Diffusion for Universal Policies}},
  author={Huang, Shuaiyi and Levy, Mara and Jiang, Zhenyu and Anandkumar, Anima and Zhu, Yuke and Fan, Linxi and Huang, De-An and Shrivastava, Abhinav},
  booktitle={IROS},
  year={2024},
  url={https://arxiv.org/abs/2406.13301},
}

Challenges, Evaluation and Opportunities for Open-World Learning

Mayank Kejriwal, Eric Kildebeck, Robert Steininger, Abhinav Shrivastava

Nature Machine Intelligence 2024

pdf /

BibTeX

@article{kejriwal2024challenges,
  title={{Challenges, Evaluation and Opportunities for Open-World Learning}},
  author={Kejriwal, Mayank and Kildebeck, Eric and Steininger, Robert and Shrivastava, Abhinav},
  journal={Nature Machine Intelligence},
  year={2024},
  url={https://www.nature.com/articles/s42256-024-00852-4},
}

Agglomerative Clustering of Atomic Actions for Unsupervised Action Segmentation

Pulkit Kumar, Austin Myers, Anurag Arnab, David A. Ross, Abhinav Shrivastava, Sudheendra Vijayanarasimhan

LPVL Workshop, CVPR 2024

BibTeX

@inproceedings{kumar2024agglomerative,
  author    = {Kumar, Pulkit and Myers, Austin and Arnab, Anurag and Ross, David A. and Shrivastava, Abhinav and Vijayanarasimhan, Sudheendra},
  title     = {{Agglomerative Clustering of Atomic Actions for Unsupervised Action Segmentation}},
  booktitle = {LPVL Workshop, CVPR},
  year      = {2024},
}

UVIS: Unsupervised Video Instance Segmentation

Shuaiyi Huang, Saksham Suri, Kamal Gupta, Sai Saketh Rambhatla, Ser-Nam Lim, Abhinav Shrivastava

L3D Workshop, CVPR 2024

pdf /

BibTeX

@inproceedings{huang2024uvis,
  title={{UVIS: Unsupervised Video Instance Segmentation}},
  author={Huang, Shuaiyi and Suri, Saksham and Gupta, Kamal and Rambhatla, Sai Saketh and Lim, Ser-Nam and Shrivastava, Abhinav},
  booktitle={L3D Workshop, CVPR},
  year={2024},
  url={https://arxiv.org/abs/2406.06908},
}

V-VIPE: Variational View Invariant Pose Embedding

Mara Levy, Abhinav Shrivastava

RHOI Workshop, CVPR 2024

pdf / webpage /

BibTeX

@inproceedings{levy2024vvipe,
  title={{V-VIPE: Variational View Invariant Pose Embedding}},
  author={Levy, Mara and Shrivastava, Abhinav},
  booktitle={RHOI Workshop, CVPR},
  year={2024},
  url={https://arxiv.org/abs/2407.07092},
}

What is Point Supervision Worth in Video Instance Segmentation?

Shuaiyi Huang, De-An Huang, Zhiding Yu, Shiyi Lan, Subhashree Radhakrishnan, Jose M. Alvarez, Abhinav Shrivastava, Anima Anandkumar

L3D Workshop, CVPR 2024

pdf /

BibTeX

@inproceedings{huang2024what,
  title={{What is Point Supervision Worth in Video Instance Segmentation?}},
  author={Huang, Shuaiyi and Huang, De-An and Yu, Zhiding and Lan, Shiyi and Radhakrishnan, Subhashree and Alvarez, Jose M. and Shrivastava, Abhinav and Anandkumar, Anima},
  booktitle={L3D Workshop, CVPR},
  year={2024},
  url={https://arxiv.org/abs/2404.01990},
}

Beyond Seen Primitive Concepts and Attribute-Object Compositional Learning

Nirat Saini, Khoi Pham, Abhinav Shrivastava

CVPR 2024

pdf / webpage /

BibTeX

@inproceedings{saini2024beyond,
  title={{Beyond Seen Primitive Concepts and Attribute-Object Compositional Learning}},
  author={Saini, Nirat and Pham, Khoi and Shrivastava, Abhinav},
  booktitle={CVPR},
  year={2024},
  url={https://openaccess.thecvf.com/content/CVPR2024/papers/Saini_Beyond_Seen_Primitive_Concepts_and_Attribute-Object_Compositional_Learning_CVPR_2024_paper.pdf},
}

Composing Object Relations and Attributes for Image-Text Matching

Khoi Pham, Chuong Huynh, Ser-Nam Lim, Abhinav Shrivastava

CVPR 2024

pdf / code /

BibTeX

@inproceedings{pham2024composing,
  title={{Composing Object Relations and Attributes for Image-Text Matching}},
  author={Pham, Khoi and Huynh, Chuong and Lim, Ser-Nam and Shrivastava, Abhinav},
  booktitle={CVPR},
  year={2024},
  url={https://arxiv.org/abs/2406.11820},
}

Explaining the Implicit Neural Canvas (XINC): Connecting Pixels to Neurons by Tracing their Contributions

Namitha Padmanabhan, Matthew Gwilliam, Pulkit Kumar, Shishira R Maiya, Max Ehrlich, Abhinav Shrivastava

CVPR 2024

pdf / webpage / code /

BibTeX

@inproceedings{padmanabhan2024explaining,
  title={{Explaining the Implicit Neural Canvas (XINC): Connecting Pixels to Neurons by Tracing their Contributions}},
  author={Padmanabhan, Namitha and Gwilliam, Matthew and Kumar, Pulkit and Maiya, Shishira R and Ehrlich, Max and Shrivastava, Abhinav},
  booktitle={CVPR},
  year={2024},
  url={https://arxiv.org/abs/2401.10217},
}

MA-LMM: Memory-Augmented Large Multimodal Model for Long-Term Video Understanding

Bo He, Hengduo Li, Young Kyun Jang, Menglin Jia, Xuefei Cao, Anshul Shah, Ser-Nam Lim, Abhinav Shrivastava

CVPR 2024

pdf / webpage / code /

BibTeX

@inproceedings{he2024malmm,
  title={{MA-LMM: Memory-Augmented Large Multimodal Model for Long-Term Video Understanding}},
  author={He, Bo and Li, Hengduo and Jang, Young Kyun and Jia, Menglin and Cao, Xuefei and Shah, Anshul and Lim, Ser-Nam and Shrivastava, Abhinav},
  booktitle={CVPR},
  year={2024},
  url={https://arxiv.org/abs/2404.05726},
}

MaGGIe: Masked Guided Gradual Human Instance Matting

Chuong Huynh, Seoung Wug Oh, Abhinav Shrivastava, Joon-Young Lee

CVPR 2024

pdf / webpage / code /

BibTeX

@inproceedings{huynh2024maggie,
  title={{MaGGIe: Masked Guided Gradual Human Instance Matting}},
  author={Huynh, Chuong and Oh, Seoung Wug and Shrivastava, Abhinav and Lee, Joon-Young},
  booktitle={CVPR},
  year={2024},
  url={https://arxiv.org/abs/2404.16035},
}

Video Prediction by Modeling Videos as Continuous Multi-Dimensional Processes

Gaurav Shrivastava, Abhinav Shrivastava

CVPR 2024

pdf / webpage /

BibTeX

@inproceedings{shrivastava2024video,
  title={{Video Prediction by Modeling Videos as Continuous Multi-Dimensional Processes}},
  author={Shrivastava, Gaurav and Shrivastava, Abhinav},
  booktitle={CVPR},
  year={2024},
  url={https://arxiv.org/abs/2412.04929},
}

Video Decomposition Prior: Editing Videos Layer by Layer

Gaurav Shrivastava, Ser-Nam Lim, Abhinav Shrivastava

ICLR 2024

pdf / webpage /

BibTeX

@inproceedings{shrivastava2024videodecomposition,
  title={{Video Decomposition Prior: Editing Videos Layer by Layer}},
  author={Shrivastava, Gaurav and Lim, Ser-Nam and Shrivastava, Abhinav},
  booktitle={ICLR},
  year={2024},
  url={https://arxiv.org/abs/2412.04930},
}

WAYEX: Waypoint Exploration using a Single Demonstration

Mara Levy, Nirat Saini, Abhinav Shrivastava

ICRA 2024

pdf / webpage /

BibTeX

@inproceedings{levy2024wayex,
  title={{WAYEX: Waypoint Exploration using a Single Demonstration}},
  author={Levy, Mara and Saini, Nirat and Shrivastava, Abhinav},
  booktitle={ICRA},
  year={2024},
  url={https://arxiv.org/abs/2407.15849},
}

Content-Aware Image Color Editing with Auxiliary Color Restoration Tasks

Yixuan Ren, Jing Shi, Zhifei Zhang, Yifei Fan, Zhe Lin, Bo He, Abhinav Shrivastava

WACV 2024

pdf /

BibTeX

@inproceedings{ren2024contentaware,
  title={{Content-Aware Image Color Editing with Auxiliary Color Restoration Tasks}},
  author={Ren, Yixuan and Shi, Jing and Zhang, Zhifei and Fan, Yifei and Lin, Zhe and He, Bo and Shrivastava, Abhinav},
  booktitle={WACV},
  year={2024},
  url={https://openaccess.thecvf.com/content/WACV2024/papers/Ren_Content-Aware_Image_Color_Editing_With_Auxiliary_Color_Restoration_Tasks_WACV_2024_paper.pdf},
}

Diff2Lip: Audio Conditioned Diffusion Models for Lip-Synchronization

Soumik Mukhopadhyay, Saksham Suri, Ravi Teja Gadde, Abhinav Shrivastava

WACV 2024

pdf / webpage / code /

BibTeX

@inproceedings{mukhopadhyay2024difflip,
  title={{Diff2Lip: Audio Conditioned Diffusion Models for Lip-Synchronization}},
  author={Mukhopadhyay, Soumik and Suri, Saksham and Gadde, Ravi Teja and Shrivastava, Abhinav},
  booktitle={WACV},
  year={2024},
  url={https://arxiv.org/abs/2308.09716},
}

GRIT: GAN Residuals for Paired Image-to-Image Translation

Saksham Suri, Moustafa Meshry, Larry Davis, Abhinav Shrivastava

WACV 2024

pdf / webpage /

BibTeX

@inproceedings{suri2024grit,
  title={{GRIT: GAN Residuals for Paired Image-to-Image Translation}},
  author={Suri, Saksham and Meshry, Moustafa and Davis, Larry and Shrivastava, Abhinav},
  booktitle={WACV},
  year={2024},
  url={https://www.cs.umd.edu/~sakshams/grit/resources/GRIT_main_paper.pdf},
}

Leveraging Bitstream Metadata for Fast, Accurate, Generalized Compressed Video Quality Enhancement

Max Ehrlich, Jon Barker, Namitha Padmanabhan, Larry Davis, Andrew Tao, Bryan Catanzaro, Abhinav Shrivastava

WACV 2024

pdf /

BibTeX

@inproceedings{ehrlich2024leveraging,
  title={{Leveraging Bitstream Metadata for Fast, Accurate, Generalized Compressed Video Quality Enhancement}},
  author={Ehrlich, Max and Barker, Jon and Padmanabhan, Namitha and Davis, Larry and Tao, Andrew and Catanzaro, Bryan and Shrivastava, Abhinav},
  booktitle={WACV},
  year={2024},
  url={https://arxiv.org/abs/2202.00011},
}

Multimodality-guided Image Style Transfer using Cross-modal GAN Inversion

Hanyu Wang, Pengxiang Wu, Kevin Dela Rosa, Chen Wang, Abhinav Shrivastava

WACV 2024

pdf / webpage / code /

BibTeX

@inproceedings{wang2024multimodalityguided,
  title={{Multimodality-guided Image Style Transfer using Cross-modal GAN Inversion}},
  author={Wang, Hanyu and Wu, Pengxiang and Dela Rosa, Kevin and Wang, Chen and Shrivastava, Abhinav},
  booktitle={WACV},
  year={2024},
  url={https://arxiv.org/abs/2312.01671},
}

2023

Video Dynamics Prior: An Internal Learning Approach for Robust Video Enhancements

Gaurav Shrivastava, Ser-Nam Lim, Abhinav Shrivastava

NeurIPS 2023

pdf / webpage /

BibTeX

@inproceedings{shrivastava2023video,
  title={{Video Dynamics Prior: An Internal Learning Approach for Robust Video Enhancements}},
  author={Shrivastava, Gaurav and Lim, Ser-Nam and Shrivastava, Abhinav},
  booktitle={NeurIPS},
  year={2023},
  url={https://arxiv.org/abs/2312.07835},
}

A Frequency Perspective of Adversarial Robustness

Shishira R Maiya, Max Ehrlich, Vatsal Agarwal, Ser-Nam Lim, Tom Goldstein, Abhinav Shrivastava

BMVC 2023

pdf /

BibTeX

@inproceedings{maiya2023a,
  title={{A Frequency Perspective of Adversarial Robustness}},
  author={Maiya, Shishira R and Ehrlich, Max and Agarwal, Vatsal and Lim, Ser-Nam and Goldstein, Tom and Shrivastava, Abhinav},
  booktitle={BMVC},
  year={2023},
  url={https://arxiv.org/abs/2111.00861},
}

ASIC: Aligning Sparse in-the-wild Image Collections

Kamal Gupta, Varun Jampani, Carlos Esteves, Abhinav Shrivastava, Ameesh Makadia, Noah Snavely, Abhishek Kar

ICCV 2023 oral

pdf / webpage / video /

BibTeX

@inproceedings{gupta2023asic,
  title={{ASIC: Aligning Sparse in-the-wild Image Collections}},
  author={Gupta, Kamal and Jampani, Varun and Esteves, Carlos and Shrivastava, Abhinav and Makadia, Ameesh and Snavely, Noah and Kar, Abhishek},
  booktitle={ICCV},
  year={2023},
  url={https://arxiv.org/abs/2303.16201},
}

BT2: Backward-compatible Training with Basis Transformation

Yifei Zhou, Zilu Li, Abhinav Shrivastava, Hengshuang Zhao, Antonio Torralba, Taipeng Tian, Ser-Nam Lim

ICCV 2023

pdf /

BibTeX

@inproceedings{zhou2023bt,
  title={{BT2: Backward-compatible Training with Basis Transformation}},
  author={Zhou, Yifei and Li, Zilu and Shrivastava, Abhinav and Zhao, Hengshuang and Torralba, Antonio and Tian, Taipeng and Lim, Ser-Nam},
  booktitle={ICCV},
  year={2023},
  url={https://arxiv.org/abs/2211.03989},
}

Chop & Learn: Recognizing and Generating Object-State Compositions

Nirat Saini, Hanyu Wang, Archana Swaminathan, Vinoj Jayasundara, Bo He, Kamal Gupta, Abhinav Shrivastava

ICCV 2023

pdf / webpage / data /

BibTeX

@inproceedings{saini2023chop,
  title={{Chop \& Learn: Recognizing and Generating Object-State Compositions}},
  author={Saini, Nirat and Wang, Hanyu and Swaminathan, Archana and Jayasundara, Vinoj and He, Bo and Gupta, Kamal and Shrivastava, Abhinav},
  booktitle={ICCV},
  year={2023},
  url={https://arxiv.org/abs/2309.14339},
}

MOST: Multiple Object Localization with Self-Supervised Transformers for Object Discovery

Sai Saketh Rambhatla, Ishan Misra, Rama Chellappa, Abhinav Shrivastava

ICCV 2023 oral

pdf / webpage / code / poster /

BibTeX

@inproceedings{rambhatla2023most,
  title={{MOST: Multiple Object Localization with Self-Supervised Transformers for Object Discovery}},
  author={Rambhatla, Sai Saketh and Misra, Ishan and Chellappa, Rama and Shrivastava, Abhinav},
  booktitle={ICCV},
  year={2023},
  url={https://arxiv.org/abs/2304.05387},
}

SHACIRA: Scalable HAsh-grid Compression for Implicit Neural Representations

Sharath Girish, Abhinav Shrivastava, Kamal Gupta

ICCV 2023

pdf / webpage / code / video / poster /

BibTeX

@inproceedings{girish2023shacira,
  title={{SHACIRA: Scalable HAsh-grid Compression for Implicit Neural Representations}},
  author={Girish, Sharath and Shrivastava, Abhinav and Gupta, Kamal},
  booktitle={ICCV},
  year={2023},
  url={https://arxiv.org/abs/2309.15848},
}

SparseDet: Improving Sparsely Annotated Object Detection with Pseudo-positive Mining

Saksham Suri, Sai Saketh Rambhatla, Rama Chellappa, Abhinav Shrivastava

ICCV 2023

pdf / webpage / code / poster /

BibTeX

@inproceedings{suri2023sparsedet,
  title={{SparseDet: Improving Sparsely Annotated Object Detection with Pseudo-positive Mining}},
  author={Suri, Saksham and Rambhatla, Sai Saketh and Chellappa, Rama and Shrivastava, Abhinav},
  booktitle={ICCV},
  year={2023},
  url={https://arxiv.org/abs/2201.04620},
}

Novelty in Image Classification

Mohsen Jafarzadeh, Akshay Raj Dhamija, Steve Cruz, Chunchun Li, Abhinav Shrivastava, Terrance E. Boult

Springer Book Chapter 2023

BibTeX

@article{jafarzadeh2023novelty,
  author  = {Jafarzadeh, Mohsen and Dhamija, Akshay Raj and Cruz, Steve and Li, Chunchun and Shrivastava, Abhinav and Boult, Terrance E.},
  title   = {{Novelty in Image Classification}},
  journal = {Springer Book Chapter},
  year    = {2023},
}

Align and Attend: Multimodal Summarization with Dual Contrastive Losses

Bo He, Jun Wang, Jielin Qiu, Trung Bui, Abhinav Shrivastava, Zhaowen Wang

CVPR 2023

pdf / webpage / code /

BibTeX

@inproceedings{he2023align,
  title={{Align and Attend: Multimodal Summarization with Dual Contrastive Losses}},
  author={He, Bo and Wang, Jun and Qiu, Jielin and Bui, Trung and Shrivastava, Abhinav and Wang, Zhaowen},
  booktitle={CVPR},
  year={2023},
  url={https://arxiv.org/abs/2303.07284}
}

FlexNeRF: Photorealistic Free-viewpoint Rendering of Moving Humans from Sparse Views

Vinoj Jayasundara, Amit Agrawal, Nicolas Heron, Abhinav Shrivastava, Larry Davis

CVPR 2023

pdf / webpage /

BibTeX

@inproceedings{jayasundara2023flexnerf,
  title={{FlexNeRF: Photorealistic Free-viewpoint Rendering of Moving Humans from Sparse Views}},
  author={Jayasundara, Vinoj and Agrawal, Amit and Heron, Nicolas and Shrivastava, Abhinav and Davis, Larry},
  booktitle={CVPR},
  year={2023},
  url={https://arxiv.org/abs/2303.14368}
}

HNeRV: A Hybrid Neural Representation for Videos

Hao Chen, Matthew Gwilliam, Ser-Nam Lim, Abhinav Shrivastava

CVPR 2023

pdf / webpage / code /

BibTeX

@inproceedings{chen2023hnerv,
  title={{HNeRV: A Hybrid Neural Representation for Videos}},
  author={Chen, Hao and Gwilliam, Matthew and Lim, Ser-Nam and Shrivastava, Abhinav},
  booktitle={CVPR},
  year={2023},
  url={https://arxiv.org/abs/2304.02633}
}

NIRVANA: Neural Implicit Representations of Videos with Adaptive Networks and Autoregressive Patch-wise Modeling

Shishira R Maiya, Sharath Girish, Max Ehrlich, Hanyu Wang, Kwot Sin Lee, Patrick Poirson, Pengxiang Wu, Chen Wang, Abhinav Shrivastava

CVPR 2023

pdf / webpage /

BibTeX

@inproceedings{maiya2023nirvana,
  title={{NIRVANA: Neural Implicit Representations of Videos with Adaptive Networks and Autoregressive Patch-wise Modeling}},
  author={Maiya, Shishira R and Girish, Sharath and Ehrlich, Max and Wang, Hanyu and Lee, Kwot Sin and Poirson, Patrick and Wu, Pengxiang and Wang, Chen and Shrivastava, Abhinav},
  booktitle={CVPR},
  year={2023},
  url={https://arxiv.org/abs/2212.14593}
}

SimpSON: Simplifying Photo Cleanup With Single-Click Distracting Object Segmentation Network

Chuong Huynh, Yuqian Zhou, Zhe Lin, Connelly Barnes, Eli Shechtman, Sohrab Amirghodsi, Abhinav Shrivastava

CVPR 2023

pdf / webpage / code / video / poster /

BibTeX

@inproceedings{huynh2023simpson,
  title={{SimpSON: Simplifying Photo Cleanup With Single-Click Distracting Object Segmentation Network}},
  author={Huynh, Chuong and Zhou, Yuqian and Lin, Zhe and Barnes, Connelly and Shechtman, Eli and Amirghodsi, Sohrab and Shrivastava, Abhinav},
  booktitle={CVPR},
  year={2023},
  url={https://openaccess.thecvf.com/content/CVPR2023/html/Huynh_SimpSON_Simplifying_Photo_Cleanup_With_Single-Click_Distracting_Object_Segmentation_Network_CVPR_2023_paper.html}
}

Teaching Matters: Investigating the Role of Supervision in Vision Transformers

Matthew Walmer, Saksham Suri, Kamal Gupta, Abhinav Shrivastava

CVPR 2023

pdf / webpage / code /

BibTeX

@inproceedings{walmer2023teaching,
  title={{Teaching Matters: Investigating the Role of Supervision in Vision Transformers}},
  author={Walmer, Matthew and Suri, Saksham and Gupta, Kamal and Shrivastava, Abhinav},
  booktitle={CVPR},
  year={2023},
  url={https://arxiv.org/abs/2212.03862}
}

Towards Scalable Neural Representation for Diverse Videos

Bo He, Xitong Yang, Hanyu Wang, Zuxuan Wu, Hao Chen, Shuaiyi Huang, Yixuan Ren, Ser-Nam Lim, Abhinav Shrivastava

CVPR 2023

pdf / webpage / code /

BibTeX

@inproceedings{he2023towards,
  title={{Towards Scalable Neural Representation for Diverse Videos}},
  author={He, Bo and Yang, Xitong and Wang, Hanyu and Wu, Zuxuan and Chen, Hao and Huang, Shuaiyi and Ren, Yixuan and Lim, Ser-Nam and Shrivastava, Abhinav},
  booktitle={CVPR},
  year={2023},
  url={https://arxiv.org/abs/2303.14124}
}

COVID-VTS: Fact Extraction and Verification on Short Video Platforms

Fuxiao Liu, Yaser Yacoob, Abhinav Shrivastava

EACL 2023

BibTeX

@inproceedings{liu2023covidvts,
  author    = {Liu, Fuxiao and Yacoob, Yaser and Shrivastava, Abhinav},
  title     = {{COVID-VTS: Fact Extraction and Verification on Short Video Platforms}},
  booktitle = {EACL},
  year      = {2023},
}

LilNetX: Lightweight Networks with EXtreme Model Compression and Structured Sparsification

Sharath Girish, Kamal Gupta, Saurabh Singh, Abhinav Shrivastava

ICLR 2023

pdf / webpage / code /

BibTeX

@inproceedings{girish2023lilnetx,
  title={{LilNetX: Lightweight Networks with EXtreme Model Compression and Structured Sparsification}},
  author={Girish, Sharath and Gupta, Kamal and Singh, Saurabh and Shrivastava, Abhinav},
  booktitle={ICLR},
  year={2023},
  url={https://openreview.net/pdf?id=NVZvalzCLg}
}

2022

Burn After Reading: Online Adaptation for Cross-domain Streaming Data

Luyu Yang, Mingfei Gao, Zeyuan Chen, Ran Xu, Abhinav Shrivastava, Chetan Ramaiah

ECCV 2022

pdf / webpage / code /

BibTeX

@inproceedings{yang2022burn,
  title={{Burn After Reading: Online Adaptation for Cross-domain Streaming Data}},
  author={Yang, Luyu and Gao, Mingfei and Chen, Zeyuan and Xu, Ran and Shrivastava, Abhinav and Ramaiah, Chetan},
  booktitle={ECCV},
  year={2022},
  url={https://arxiv.org/abs/2112.04345}
}

Improving Closed and Open Set Attribute Prediction using Transformers

Khoi Pham, Kushal Kafle, Zhe Lin, Zhihong Ding, Scott Cohen, Quan Hung Tran, Abhinav Shrivastava

ECCV 2022

pdf / webpage / code /

BibTeX

@inproceedings{pham2022improving,
  title={{Improving Closed and Open Set Attribute Prediction using Transformers}},
  author={Pham, Khoi and Kafle, Kushal and Lin, Zhe and Ding, Zhihong and Cohen, Scott and Tran, Quan Hung and Shrivastava, Abhinav},
  booktitle={ECCV},
  year={2022},
  url={https://www.ecva.net/papers/eccv_2022/papers_ECCV/papers/136850199.pdf}
}

Learning Semantic Correspondence with Sparse Annotations

Shuaiyi Huang, Luyu Yang, Bo He, Songyang Zhang, Xuming He, Abhinav Shrivastava

ECCV 2022

pdf / webpage / code /

BibTeX

@inproceedings{huang2022learning,
  title={{Learning Semantic Correspondence with Sparse Annotations}},
  author={Huang, Shuaiyi and Yang, Luyu and He, Bo and Zhang, Songyang and He, Xuming and Shrivastava, Abhinav},
  booktitle={ECCV},
  year={2022},
  url={https://arxiv.org/abs/2208.06974}
}

Neural Space-Filling Curves

Hanyu Wang, Kamal Gupta, Larry Davis, Abhinav Shrivastava

ECCV 2022

pdf / webpage / code / poster /

BibTeX

@inproceedings{wang2022neural,
  title={{Neural Space-Filling Curves}},
  author={Wang, Hanyu and Gupta, Kamal and Davis, Larry and Shrivastava, Abhinav},
  booktitle={ECCV},
  year={2022},
  url={https://arxiv.org/abs/2204.08453}
}

ASM-Loc: Action-aware Segment Modeling for Weakly-Supervised Temporal Action Localization

Bo He, Xitong Yang, Le Kang, Zhiyu Cheng, Xin Zhou, Abhinav Shrivastava

CVPR 2022

pdf / webpage / code /

BibTeX

@inproceedings{he2022asmloc,
  title={{ASM-Loc: Action-aware Segment Modeling for Weakly-Supervised Temporal Action Localization}},
  author={He, Bo and Yang, Xitong and Kang, Le and Cheng, Zhiyu and Zhou, Xin and Shrivastava, Abhinav},
  booktitle={CVPR},
  year={2022},
  url={https://arxiv.org/abs/2203.15187}
}

Beyond Supervised vs. Unsupervised: Representative Benchmarking and Analysis of Image Representation Learning

Matthew Gwilliam, Abhinav Shrivastava

CVPR 2022

pdf / webpage / code /

BibTeX

@inproceedings{gwilliam2022beyond,
  title={{Beyond Supervised vs. Unsupervised: Representative Benchmarking and Analysis of Image Representation Learning}},
  author={Gwilliam, Matthew and Shrivastava, Abhinav},
  booktitle={CVPR},
  year={2022},
  url={https://arxiv.org/abs/2206.08347}
}

Disentangling Visual Embeddings for Attributes and Objects

Nirat Saini, Khoi Pham, Abhinav Shrivastava

CVPR 2022 oral

pdf / webpage / code /

BibTeX

@inproceedings{saini2022disentangling,
  title={{Disentangling Visual Embeddings for Attributes and Objects}},
  author={Saini, Nirat and Pham, Khoi and Shrivastava, Abhinav},
  booktitle={CVPR},
  year={2022},
  url={https://arxiv.org/abs/2205.08536}
}

Dual-Key Multimodal Backdoors for Visual Question Answering

Matthew Walmer, Karan Sikka, Indranil Sur, Abhinav Shrivastava, Susmit Jha

CVPR 2022

pdf / code / demo /

BibTeX

@inproceedings{walmer2022dualkey,
  title={{Dual-Key Multimodal Backdoors for Visual Question Answering}},
  author={Walmer, Matthew and Sikka, Karan and Sur, Indranil and Shrivastava, Abhinav and Jha, Susmit},
  booktitle={CVPR},
  year={2022},
  url={https://arxiv.org/abs/2112.07668}
}

ObjectFormer for Image Manipulation Detection and Localization

Junke Wang, Zuxuan Wu, Jingjing Chen, Xintong Han, Abhinav Shrivastava, Ser-Nam Lim, Yu-Gang Jiang

CVPR 2022

pdf /

BibTeX

@inproceedings{wang2022objectformer,
  title={{ObjectFormer for Image Manipulation Detection and Localization}},
  author={Wang, Junke and Wu, Zuxuan and Chen, Jingjing and Han, Xintong and Shrivastava, Abhinav and Lim, Ser-Nam and Jiang, Yu-Gang},
  booktitle={CVPR},
  year={2022},
  url={https://arxiv.org/abs/2203.14681}
}

Pose And Joint-Aware Action Recognition

Anshul Shah, Shlok Mishra, Ankan Bansal, Jun-Cheng Chen, Rama Chellappa, Abhinav Shrivastava

WACV 2022

pdf / code / video /

BibTeX

@inproceedings{shah2022pose,
  title={{Pose And Joint-Aware Action Recognition}},
  author={Shah, Anshul and Mishra, Shlok and Bansal, Ankan and Chen, Jun-Cheng and Chellappa, Rama and Shrivastava, Abhinav},
  booktitle={WACV},
  year={2022},
  url={https://arxiv.org/abs/2010.08164}
}

Rethinking Pseudo Labels for Semi-Supervised Object Detection

Hengduo Li, Zuxuan Wu, Abhinav Shrivastava, Larry Davis

AAAI 2022

pdf /

BibTeX

@inproceedings{li2022rethinking,
  title={{Rethinking Pseudo Labels for Semi-Supervised Object Detection}},
  author={Li, Hengduo and Wu, Zuxuan and Shrivastava, Abhinav and Davis, Larry},
  booktitle={AAAI},
  year={2022},
  url={https://arxiv.org/abs/2106.00168}
}

2021

NeRV: Neural Representations for Videos

Hao Chen, Bo He, Hanyu Wang, Yixuan Ren, Ser-Nam Lim, Abhinav Shrivastava

NeurIPS 2021

pdf / webpage / code /

BibTeX

@inproceedings{chen2021nerv,
  title={{NeRV: Neural Representations for Videos}},
  author={Chen, Hao and He, Bo and Wang, Hanyu and Ren, Yixuan and Lim, Ser-Nam and Shrivastava, Abhinav},
  booktitle={NeurIPS},
  year={2021},
  url={https://arxiv.org/abs/2110.13903}
}

PatchGame: Learning to Signal Mid-level Patches in Referential Games

Kamal Gupta, Gowthami Somepalli, Anubhav, Vinoj Jayasundara, Matthias Zwicker, Abhinav Shrivastava

NeurIPS 2021

pdf / webpage / code / video /

BibTeX

@inproceedings{gupta2021patchgame,
  title={{PatchGame: Learning to Signal Mid-level Patches in Referential Games}},
  author={Gupta, Kamal and Somepalli, Gowthami and Anubhav and Jayasundara, Vinoj and Zwicker, Matthias and Shrivastava, Abhinav},
  booktitle={NeurIPS},
  year={2021},
  url={https://arxiv.org/abs/2111.01785}
}

Deep Co-Training with Task Decomposition for Semi-Supervised Domain Adaptation

Luyu Yang, Yan Wang, Mingfei Gao, Abhinav Shrivastava, Kilian Weinberger, Wei-Lun Chao, Ser-Nam Lim

ICCV 2021

pdf / code /

BibTeX

@inproceedings{yang2021deep,
  title={{Deep Co-Training with Task Decomposition for Semi-Supervised Domain Adaptation}},
  author={Yang, Luyu and Wang, Yan and Gao, Mingfei and Shrivastava, Abhinav and Weinberger, Kilian and Chao, Wei-Lun and Lim, Ser-Nam},
  booktitle={ICCV},
  year={2021},
  url={https://openaccess.thecvf.com/content/ICCV2021/papers/Yang_Deep_Co-Training_With_Task_Decomposition_for_Semi-Supervised_Domain_Adaptation_ICCV_2021_paper.pdf}
}

Deep Video Inpainting Detection

Peng Zhou, Ning Yu, Zuxuan Wu, Larry Davis, Abhinav Shrivastava, Ser-Nam Lim

BMVC 2021

pdf / video /

BibTeX

@inproceedings{zhou2021deep,
  title={{Deep Video Inpainting Detection}},
  author={Zhou, Peng and Yu, Ning and Wu, Zuxuan and Davis, Larry and Shrivastava, Abhinav and Lim, Ser-Nam},
  booktitle={BMVC},
  year={2021},
  url={https://arxiv.org/abs/2101.11080}
}

GTA: Global Temporal Attention for Video Action Understanding

Bo He, Xitong Yang, Zuxuan Wu, Hao Chen, Ser-Nam Lim, Abhinav Shrivastava

BMVC 2021

pdf / video /

BibTeX

@inproceedings{he2021gta,
  title={{GTA: Global Temporal Attention for Video Action Understanding}},
  author={He, Bo and Yang, Xitong and Wu, Zuxuan and Chen, Hao and Lim, Ser-Nam and Shrivastava, Abhinav},
  booktitle={BMVC},
  year={2021},
  url={https://arxiv.org/abs/2012.08510}
}

HR-RCNN: Hierarchical Relational Reasoning for Object Detection

Hao Chen, Abhinav Shrivastava

BMVC 2021

pdf / video /

BibTeX

@inproceedings{chen2021hrrcnn,
  title={{HR-RCNN: Hierarchical Relational Reasoning for Object Detection}},
  author={Chen, Hao and Shrivastava, Abhinav},
  booktitle={BMVC},
  year={2021},
  url={https://arxiv.org/abs/2110.13892}
}

Layout Generation and Completion with Self-attention

Kamal Gupta, Alessandro Achille, Justin Lazarow, Larry Davis, Vijay Mahadevan, Abhinav Shrivastava

ICCV 2021

pdf / webpage / code /

BibTeX

@inproceedings{gupta2021layout,
  title={{Layout Generation and Completion with Self-attention}},
  author={Gupta, Kamal and Achille, Alessandro and Lazarow, Justin and Davis, Larry and Mahadevan, Vijay and Shrivastava, Abhinav},
  booktitle={ICCV},
  year={2021},
  url={https://arxiv.org/abs/2006.14615}
}

Learned Spatial Representations for Few-shot Talking-Head Synthesis

Moustafa Meshry, Saksham Suri, Larry Davis, Abhinav Shrivastava

ICCV 2021

pdf / webpage / code / video /

BibTeX

@inproceedings{meshry2021learned,
  title={{Learned Spatial Representations for Few-shot Talking-Head Synthesis}},
  author={Meshry, Moustafa and Suri, Saksham and Davis, Larry and Shrivastava, Abhinav},
  booktitle={ICCV},
  year={2021},
  url={https://arxiv.org/abs/2104.14557}
}

The Pursuit of Knowledge: Discovering and Localizing Novel Categories using Dual Memory

Sai Saketh Rambhatla, Rama Chellappa, Abhinav Shrivastava

ICCV 2021

pdf / webpage /

BibTeX

@inproceedings{rambhatla2021the,
  title={{The Pursuit of Knowledge: Discovering and Localizing Novel Categories using Dual Memory}},
  author={Rambhatla, Sai Saketh and Chellappa, Rama and Shrivastava, Abhinav},
  booktitle={ICCV},
  year={2021},
  url={https://arxiv.org/abs/2105.01652}
}

Towards Discovery and Attribution of Open-world GAN Generated Images

Sharath Girish, Saksham Suri, Sai Saketh Rambhatla, Abhinav Shrivastava

ICCV 2021

pdf / webpage /

BibTeX

@inproceedings{girish2021towards,
  title={{Towards Discovery and Attribution of Open-world GAN Generated Images}},
  author={Girish, Sharath and Suri, Saksham and Rambhatla, Sai Saketh and Shrivastava, Abhinav},
  booktitle={ICCV},
  year={2021},
  url={http://www.cs.umd.edu/~sakshams/project_page/resources/full_paper.pdf}
}

Leveraging Hand-Object Interactions in Assistive Egocentric Vision

Kyungjun Lee, Abhinav Shrivastava, Hernisa Kacorri

TPAMI 2021

pdf /

BibTeX

@article{lee2021leveraging,
  title={{Leveraging Hand-Object Interactions in Assistive Egocentric Vision}},
  author={Lee, Kyungjun and Shrivastava, Abhinav and Kacorri, Hernisa},
  journal={TPAMI},
  year={2021},
  url={https://ieeexplore.ieee.org/document/9591443}
}

2D or not 2D? Adaptive 3D Convolution Selection for Efficient Video Recognition

Hengduo Li, Zuxuan Wu, Abhinav Shrivastava, Larry Davis

CVPR 2021

pdf /

BibTeX

@inproceedings{li2021d,
  title={{2D or not 2D? Adaptive 3D Convolution Selection for Efficient Video Recognition}},
  author={Li, Hengduo and Wu, Zuxuan and Shrivastava, Abhinav and Davis, Larry},
  booktitle={CVPR},
  year={2021},
  url={https://arxiv.org/abs/2012.14950}
}

Hierarchical Video Prediction for Human Object Interaction

Navaneeth Bodla, Gaurav Shrivastava, Rama Chellappa, Abhinav Shrivastava

CVPR 2021

pdf / webpage / video /

BibTeX

@inproceedings{bodla2021hierarchical,
  title={{Hierarchical Video Prediction for Human Object Interaction}},
  author={Bodla, Navaneeth and Shrivastava, Gaurav and Chellappa, Rama and Shrivastava, Abhinav},
  booktitle={CVPR},
  year={2021},
  url={https://horn-video.github.io/camera_ready.pdf}
}

Knowledge Evolution in Neural Networks

Ahmed Taha, Abhinav Shrivastava, Larry Davis

CVPR 2021 oral

pdf / webpage / code / blog /

BibTeX

@inproceedings{taha2021knowledge,
  title={{Knowledge Evolution in Neural Networks}},
  author={Taha, Ahmed and Shrivastava, Abhinav and Davis, Larry},
  booktitle={CVPR},
  year={2021},
  url={https://arxiv.org/abs/2103.05152}
}

Learning Graphs for Knowledge Transfer with Limited Labels

Pallabi Ghosh, Nirat Saini, Larry Davis, Abhinav Shrivastava

CVPR 2021

pdf / webpage / code / video /

BibTeX

@inproceedings{ghosh2021learning,
  title={{Learning Graphs for Knowledge Transfer with Limited Labels}},
  author={Ghosh, Pallabi and Saini, Nirat and Davis, Larry and Shrivastava, Abhinav},
  booktitle={CVPR},
  year={2021},
  url={https://openaccess.thecvf.com/content/CVPR2021/papers/Ghosh_Learning_Graphs_for_Knowledge_Transfer_With_Limited_Labels_CVPR_2021_paper.pdf}
}

Learning to Predict Visual Attributes in the Wild

Khoi Pham, Kushal Kafle, Zhe Lin, Zhihong Ding, Scott Cohen, Quan Hung Tran, Abhinav Shrivastava

CVPR 2021

pdf / webpage / code / demo /

BibTeX

@inproceedings{pham2021learning,
  title={{Learning to Predict Visual Attributes in the Wild}},
  author={Pham, Khoi and Kafle, Kushal and Lin, Zhe and Ding, Zhihong and Cohen, Scott and Tran, Quan Hung and Shrivastava, Abhinav},
  booktitle={CVPR},
  year={2021},
  url={http://arxiv.org/abs/2106.09707}
}

Style-based Encoder Pre-training for Multi-modal Image Synthesis

Moustafa Meshry, Yixuan Ren, Larry Davis, Abhinav Shrivastava

CVPR 2021

pdf / webpage / code /

BibTeX

@inproceedings{meshry2021stylebased,
  title={{Style-based Encoder Pre-training for Multi-modal Image Synthesis}},
  author={Meshry, Moustafa and Ren, Yixuan and Davis, Larry and Shrivastava, Abhinav},
  booktitle={CVPR},
  year={2021},
  url={https://www.cs.umd.edu/~mmeshry/projects/step/resources/step_cvpr2021-full.pdf}
}

The Lottery Ticket Hypothesis for Object Recognition

Sharath Girish, Shishira R Maiya, Kamal Gupta, Hao Chen, Larry Davis, Abhinav Shrivastava

CVPR 2021

pdf / webpage / code /

BibTeX

@inproceedings{girish2021the,
  title={{The Lottery Ticket Hypothesis for Object Recognition}},
  author={Girish, Sharath and Maiya, Shishira R and Gupta, Kamal and Chen, Hao and Davis, Larry and Shrivastava, Abhinav},
  booktitle={CVPR},
  year={2021},
  url={https://arxiv.org/abs/2012.04643}
}

Diverse Video Generation using a Gaussian Process Trigger

Gaurav Shrivastava, Abhinav Shrivastava

ICLR 2021

pdf / webpage / code /

BibTeX

@inproceedings{shrivastava2021diverse,
  title={{Diverse Video Generation using a Gaussian Process Trigger}},
  author={Shrivastava, Gaurav and Shrivastava, Abhinav},
  booktitle={ICLR},
  year={2021},
  url={https://openreview.net/forum?id=Qm7R_SdqTpT}
}

No-frills Dynamic Planning using Static Planners

Mara Levy, Vasista Ayyagari, Abhinav Shrivastava

ICRA 2021

pdf / webpage / video /

BibTeX

@inproceedings{levy2021nofrills,
  title={{No-frills Dynamic Planning using Static Planners}},
  author={Levy, Mara and Ayyagari, Vasista and Shrivastava, Abhinav},
  booktitle={ICRA},
  year={2021},
  url={https://mlevy2525.github.io/files/DynamicPlanningAddOn.pdf}
}

A Unifying Framework for Formal Theories of Novelty

Terrance E. Boult, Przemyslaw A. Grabowicz, Derek S. Prijatelj, Roni Stern, Lawrence Holder, Joshua Alspector, Mohsen Jafarzadeh, Touqeer Ahmad, Akshay Raj Dhamija, Chunchun Li, Steve Cruz, Abhinav Shrivastava, Carl Vondrick, Walter J. Scheirer

AAAI 2021 BlueSky talk

pdf /

BibTeX

@inproceedings{boult2021a,
  title={{A Unifying Framework for Formal Theories of Novelty}},
  author={Boult, Terrance E. and Grabowicz, Przemyslaw A. and Prijatelj, Derek S. and Stern, Roni and Holder, Lawrence and Alspector, Joshua and Jafarzadeh, Mohsen and Ahmad, Touqeer and Dhamija, Akshay Raj and Li, Chunchun and Cruz, Steve and Shrivastava, Abhinav and Vondrick, Carl and Scheirer, Walter J.},
  booktitle={AAAI},
  year={2021},
  url={https://ojs.aaai.org/index.php/AAAI/article/view/17766/17573}
}

2020

All About Knowledge Graphs for Actions

Pallabi Ghosh, Nirat Saini, Larry Davis, Abhinav Shrivastava

arXiv 2020

pdf /

BibTeX

@article{ghosh2020all,
  title={{All About Knowledge Graphs for Actions}},
  author={Ghosh, Pallabi and Saini, Nirat and Davis, Larry and Shrivastava, Abhinav},
  journal={arXiv},
  year={2020},
  url={https://arxiv.org/abs/2008.12432}
}

A Generic Visualization Approach for Convolutional Neural Networks

Ahmed Taha, Xitong Yang, Abhinav Shrivastava, Larry Davis

ECCV 2020

pdf / webpage / code / video /

BibTeX

@inproceedings{taha2020a,
  title={{A Generic Visualization Approach for Convolutional Neural Networks}},
  author={Taha, Ahmed and Yang, Xitong and Shrivastava, Abhinav and Davis, Larry},
  booktitle={ECCV},
  year={2020},
  url={https://arxiv.org/abs/2007.09748}
}

Curriculum Manager for Source Selection in Multi-Source Domain Adaptation

Luyu Yang, Yogesh Balaji, Ser-Nam Lim, Abhinav Shrivastava

ECCV 2020

pdf /

BibTeX

@inproceedings{yang2020curriculum,
  title={{Curriculum Manager for Source Selection in Multi-Source Domain Adaptation}},
  author={Yang, Luyu and Balaji, Yogesh and Lim, Ser-Nam and Shrivastava, Abhinav},
  booktitle={ECCV},
  year={2020},
  url={https://arxiv.org/abs/2007.01261}
}

Depth Completion using a View-constrained Deep Prior

Pallabi Ghosh, Vibhav Vineet, Larry Davis, Abhinav Shrivastava, Sudipta Sinha, Neel Joshi

3DV 2020

pdf /

BibTeX

@inproceedings{ghosh2020depth,
  title={{Depth Completion using a View-constrained Deep Prior}},
  author={Ghosh, Pallabi and Vineet, Vibhav and Davis, Larry and Shrivastava, Abhinav and Sinha, Sudipta and Joshi, Neel},
  booktitle={3DV},
  year={2020},
  url={https://arxiv.org/abs/2001.07791}
}

Group Ensemble: Learning an Ensemble of ConvNets in a single ConvNet

Hao Chen, Abhinav Shrivastava

arXiv 2020

pdf / code /

BibTeX

@article{chen2020group,
  title={{Group Ensemble: Learning an Ensemble of ConvNets in a single ConvNet}},
  author={Chen, Hao and Shrivastava, Abhinav},
  journal={arXiv},
  year={2020},
  url={https://arxiv.org/pdf/2007.00649.pdf}
}

Improved Modeling of 3D Shapes with Multi-view Depth Maps

Kamal Gupta, Susmija Jabbireddy, Ketul Shah, Abhinav Shrivastava, Matthias Zwicker

3DV 2020 oral

pdf / webpage / code / video /

BibTeX

@inproceedings{gupta2020improved,
  title={{Improved Modeling of 3D Shapes with Multi-view Depth Maps}},
  author={Gupta, Kamal and Jabbireddy, Susmija and Shah, Ketul and Shrivastava, Abhinav and Zwicker, Matthias},
  booktitle={3DV},
  year={2020},
  url={https://arxiv.org/abs/2009.03298}
}

Quantization Guided JPEG Artifact Correction

Max Ehrlich, Ser-Nam Lim, Larry Davis, Abhinav Shrivastava

ECCV 2020

pdf / code / video /

BibTeX

@inproceedings{ehrlich2020quantization,
  title={{Quantization Guided JPEG Artifact Correction}},
  author={Ehrlich, Max and Lim, Ser-Nam and Davis, Larry and Shrivastava, Abhinav},
  booktitle={ECCV},
  year={2020},
  url={https://arxiv.org/abs/2004.09320}
}

End-to-end Learning of Compressible Features

Saurabh Singh, Sami Abu-El-Haija, Nick Johnston, Johannes Balle, Abhinav Shrivastava, George Toderici

ICIP 2020

pdf /

BibTeX

@inproceedings{singh2020endtoend,
  title={{End-to-end Learning of Compressible Features}},
  author={Singh, Saurabh and Abu-El-Haija, Sami and Johnston, Nick and Balle, Johannes and Shrivastava, Abhinav and Toderici, George},
  booktitle={ICIP},
  year={2020},
  url={https://arxiv.org/abs/2007.11797}
}

PatchVAE: Learning Local Latent Codes for Recognition

Kamal Gupta, Saurabh Singh, Abhinav Shrivastava

CVPR 2020

pdf / webpage / code / video /

BibTeX

@inproceedings{gupta2020patchvae,
  title={{PatchVAE: Learning Local Latent Codes for Recognition}},
  author={Gupta, Kamal and Singh, Saurabh and Shrivastava, Abhinav},
  booktitle={CVPR},
  year={2020},
  url={https://arxiv.org/abs/2004.03623}
}

Scalable Model Compression by Entropy Penalized Reparameterization

Deniz Oktay, Johannes Balle, Saurabh Singh, Abhinav Shrivastava

ICLR 2020

pdf /

BibTeX

@inproceedings{oktay2020scalable,
  title={{Scalable Model Compression by Entropy Penalized Reparameterization}},
  author={Oktay, Deniz and Balle, Johannes and Singh, Saurabh and Shrivastava, Abhinav},
  booktitle={ICLR},
  year={2020},
  url={https://openreview.net/pdf?id=HkgxW0EYDS}
}

Boosting Standard Classification Architectures Through a Ranking Regularizer

Ahmed Taha, Yi-Ting Chen, Teruhisa Misu, Abhinav Shrivastava, Larry Davis

WACV 2020

pdf / webpage / code /

BibTeX

@inproceedings{taha2020boosting,
  title={{Boosting Standard Classification Architectures Through a Ranking Regularizer}},
  author={Taha, Ahmed and Chen, Yi-Ting and Misu, Teruhisa and Shrivastava, Abhinav and Davis, Larry},
  booktitle={WACV},
  year={2020},
  url={http://openaccess.thecvf.com/content_WACV_2020/papers/Taha_Boosting_Standard_Classification_Architectures_Through_a_Ranking_Regularizer_WACV_2020_paper.pdf}
}

Hand-Priming in Object Localization for Assistive Egocentric Vision

Kyungjun Lee, Abhinav Shrivastava, Hernisa Kacorri

WACV 2020 oral, best paper award

pdf / video /

BibTeX

@inproceedings{lee2020handpriming,
  title={{Hand-Priming in Object Localization for Assistive Egocentric Vision}},
  author={Lee, Kyungjun and Shrivastava, Abhinav and Kacorri, Hernisa},
  booktitle={WACV},
  year={2020},
  url={https://arxiv.org/pdf/2002.12557.pdf}
}

Detecting Human-Object Interactions via Functional Generalization

Ankan Bansal, Sai Saketh Rambhatla, Abhinav Shrivastava, Rama Chellappa

AAAI 2020

pdf /

BibTeX

@inproceedings{bansal2020detecting,
  title={{Detecting Human-Object Interactions via Functional Generalization}},
  author={Bansal, Ankan and Rambhatla, Sai Saketh and Shrivastava, Abhinav and Chellappa, Rama},
  booktitle={AAAI},
  year={2020},
  url={https://arxiv.org/pdf/1904.03181.pdf}
}

Generate, Segment and Refine: Towards Generic Manipulation Segmentation

Peng Zhou, Bor-Chun Chen, Xintong Han, Mahyar Najibi, Abhinav Shrivastava, Ser-Nam Lim, Larry Davis

AAAI 2020

pdf / code /

BibTeX

@inproceedings{zhou2020generate,
  title={{Generate, Segment and Refine: Towards Generic Manipulation Segmentation}},
  author={Zhou, Peng and Chen, Bor-Chun and Han, Xintong and Najibi, Mahyar and Shrivastava, Abhinav and Lim, Ser-Nam and Davis, Larry},
  booktitle={AAAI},
  year={2020},
  url={https://arxiv.org/pdf/1811.09729.pdf}
}

2019

Render4Completion: Synthesizing Multi-view Depth Maps for 3D Shape Completion

Tao Hu, Zhizhong Han, Abhinav Shrivastava, Matthias Zwicker

GeoMDL Workshop, ICCV 2019

pdf /

BibTeX

@inproceedings{hu2019rendercompletion,
  title={{Render4Completion: Synthesizing Multi-view Depth Maps for 3D Shape Completion}},
  author={Hu, Tao and Han, Zhizhong and Shrivastava, Abhinav and Zwicker, Matthias},
  booktitle={GeoMDL Workshop, ICCV},
  year={2019},
  url={https://arxiv.org/pdf/1904.08366.pdf}
}

EvalNorm: Estimating Batch Normalization Statistics for Evaluation

Saurabh Singh, Abhinav Shrivastava

ICCV 2019

pdf /

BibTeX

@inproceedings{singh2019evalnorm,
  title={{EvalNorm: Estimating Batch Normalization Statistics for Evaluation}},
  author={Singh, Saurabh and Shrivastava, Abhinav},
  booktitle={ICCV},
  year={2019},
  url={https://arxiv.org/pdf/1904.06031.pdf}
}

Relational Action Forecasting

Chen Sun, Abhinav Shrivastava, Carl Vondrick, Rahul Sukthankar, Kevin Murphy, Cordelia Schmid

CVPR 2019 best paper finalist

pdf /

BibTeX

@inproceedings{sun2019relational,
  title={{Relational Action Forecasting}},
  author={Sun, Chen and Shrivastava, Abhinav and Vondrick, Carl and Sukthankar, Rahul and Murphy, Kevin and Schmid, Cordelia},
  booktitle={CVPR},
  year={2019},
  url={https://arxiv.org/pdf/1904.04231.pdf}
}

2018

Actor-centric Relation Network

Chen Sun, Abhinav Shrivastava, Carl Vondrick, Kevin Murphy, Rahul Sukthankar, Cordelia Schmid

ECCV 2018

pdf /

BibTeX

@inproceedings{sun2018actorcentric,
  title={{Actor-centric Relation Network}},
  author={Sun, Chen and Shrivastava, Abhinav and Vondrick, Carl and Murphy, Kevin and Sukthankar, Rahul and Schmid, Cordelia},
  booktitle={ECCV},
  year={2018},
  url={https://arxiv.org/pdf/1807.10982.pdf}
}

Tracking Emerges by Colorizing Videos

Carl Vondrick, Abhinav Shrivastava, Alireza Fathi, Sergio Guadarrama, Kevin Murphy

ECCV 2018

pdf /

BibTeX

@inproceedings{vondrick2018tracking,
  title={{Tracking Emerges by Colorizing Videos}},
  author={Vondrick, Carl and Shrivastava, Abhinav and Fathi, Alireza and Guadarrama, Sergio and Murphy, Kevin},
  booktitle={ECCV},
  year={2018},
  url={https://arxiv.org/pdf/1806.09594.pdf}
}

2017

Revisiting Unreasonable Effectiveness of Data in Deep Learning Era

Chen Sun, Abhinav Shrivastava, Saurabh Singh, Abhinav Gupta

ICCV 2017 spotlight

pdf /

BibTeX

@inproceedings{sun2017revisiting,
  title={{Revisiting Unreasonable Effectiveness of Data in Deep Learning Era}},
  author={Sun, Chen and Shrivastava, Abhinav and Singh, Saurabh and Gupta, Abhinav},
  booktitle={ICCV},
  year={2017},
  url={https://arxiv.org/pdf/1707.02968}
}

A-Fast-RCNN: Hard Positive Generation via Adversary for Object Detection

Xiaolong Wang, Abhinav Shrivastava, Abhinav Gupta

CVPR 2017

pdf / code /

BibTeX

@inproceedings{wang2017afastrcnn,
  title={{A-Fast-RCNN: Hard Positive Generation via Adversary for Object Detection}},
  author={Wang, Xiaolong and Shrivastava, Abhinav and Gupta, Abhinav},
  booktitle={CVPR},
  year={2017},
  url={https://arxiv.org/pdf/1704.03414.pdf}
}

2016

Beyond Skip Connections: Top-Down Modulation for Object Detection

Abhinav Shrivastava, Rahul Sukthankar, Jitendra Malik, Abhinav Gupta

arXiv 2016

pdf /

BibTeX

@article{shrivastava2016beyond,
  title={{Beyond Skip Connections: Top-Down Modulation for Object Detection}},
  author={Shrivastava, Abhinav and Sukthankar, Rahul and Malik, Jitendra and Gupta, Abhinav},
  journal={arXiv},
  year={2016},
  url={https://arxiv.org/pdf/1612.06851}
}

Contextual Priming and Feedback for Faster R-CNN

Abhinav Shrivastava, Abhinav Gupta

ECCV 2016

pdf / poster /

BibTeX

@inproceedings{shrivastava2016contextual,
  title={{Contextual Priming and Feedback for Faster R-CNN}},
  author={Shrivastava, Abhinav and Gupta, Abhinav},
  booktitle={ECCV},
  year={2016},
  url={https://link.springer.com/content/pdf/10.1007/978-3-319-46448-0_20.pdf}
}

Cross-stitch Networks for Multi-task Learning

Ishan Misra, Abhinav Shrivastava, Abhinav Gupta, Martial Hebert

CVPR 2016 spotlight

pdf / poster / slides /

BibTeX

@inproceedings{misra2016crossstitch,
  title={{Cross-stitch Networks for Multi-task Learning}},
  author={Misra, Ishan and Shrivastava, Abhinav and Gupta, Abhinav and Hebert, Martial},
  booktitle={CVPR},
  year={2016},
  url={https://arxiv.org/abs/1604.03539}
}

Training Region-based Object Detectors with Online Hard Example Mining

Abhinav Shrivastava, Abhinav Gupta, Ross Girshick

CVPR 2016 oral

pdf / code / video / poster / slides /

BibTeX

@inproceedings{shrivastava2016training,
  title={{Training Region-based Object Detectors with Online Hard Example Mining}},
  author={Shrivastava, Abhinav and Gupta, Abhinav and Girshick, Ross},
  booktitle={CVPR},
  year={2016},
  url={https://arxiv.org/abs/1604.03540}
}

2015

Applying artificial vision models to human scene understanding

Elissa M. Aminoff, Mariya Toneva, Abhinav Shrivastava, Xinlei Chen, Ishan Misra, Abhinav Gupta, Michael Tarr

Frontiers in Computational Neuroscience 2015

pdf /

BibTeX

@article{aminoff2015applying,
  title={{Applying artificial vision models to human scene understanding}},
  author={Aminoff, Elissa M. and Toneva, Mariya and Shrivastava, Abhinav and Chen, Xinlei and Misra, Ishan and Gupta, Abhinav and Tarr, Michael},
  journal={Frontiers in Computational Neuroscience},
  year={2015},
  url={http://journal.frontiersin.org/Journal/10.3389/fncom.2015.00008/pdf}
}

Mid-level Elements for Object Detection

Aayush Bansal, Abhinav Shrivastava, Carl Doersch, Abhinav Gupta

arXiv 2015

pdf / supplement /

BibTeX

@article{bansal2015midlevel,
  title={{Mid-level Elements for Object Detection}},
  author={Bansal, Aayush and Shrivastava, Abhinav and Doersch, Carl and Gupta, Abhinav},
  journal={arXiv},
  year={2015},
  url={http://arxiv.org/pdf/1504.07284}
}

Watch and Learn: Semi-supervised Learning of Object Detectors from Videos

Ishan Misra, Abhinav Shrivastava, Martial Hebert

CVPR 2015

pdf / webpage / poster /

BibTeX

@inproceedings{misra2015watch,
  title={{Watch and Learn: Semi-supervised Learning of Object Detectors from Videos}},
  author={Misra, Ishan and Shrivastava, Abhinav and Hebert, Martial},
  booktitle={CVPR},
  year={2015},
  url={https://arxiv.org/abs/1505.05769}
}

2014

Enriching Visual Knowledge Bases via Object Discovery and Segmentation

Xinlei Chen, Abhinav Shrivastava, Abhinav Gupta

CVPR 2014

pdf / webpage / code / poster / supplement /

BibTeX

@inproceedings{chen2014enriching,
  title={{Enriching Visual Knowledge Bases via Object Discovery and Segmentation}},
  author={Chen, Xinlei and Shrivastava, Abhinav and Gupta, Abhinav},
  booktitle={CVPR},
  year={2014},
  url={http://xinleic.xyz/papers/cvpr14.pdf}
}

Data-driven Exemplar Model Selection

Ishan Misra, Abhinav Shrivastava, Martial Hebert

WACV 2014 oral · best student paper award

pdf / webpage / slides /

BibTeX

@inproceedings{misra2014datadriven,
  title={{Data-driven Exemplar Model Selection}},
  author={Misra, Ishan and Shrivastava, Abhinav and Hebert, Martial},
  booktitle={WACV},
  year={2014},
  url={http://www.cs.cmu.edu/~imisra/projects/budgetedDet/selection-wacv-2014.pdf}
}

2013

Building Part-based Object Detectors via 3D Geometry

Abhinav Shrivastava, Abhinav Gupta

ICCV 2013

pdf / webpage /

BibTeX

@inproceedings{shrivastava2013building,
  title={{Building Part-based Object Detectors via 3D Geometry}},
  author={Shrivastava, Abhinav and Gupta, Abhinav},
  booktitle={ICCV},
  year={2013},
  url={http://graphics.cs.cmu.edu/projects/gdpm/gDPM.pdf}
}

NEIL: Extracting Visual Knowledge from Web Data

Xinlei Chen, Abhinav Shrivastava, Abhinav Gupta

ICCV 2013 oral

pdf / webpage / code / video / poster / slides /

BibTeX

@inproceedings{chen2013neil,
  title={{NEIL: Extracting Visual Knowledge from Web Data}},
  author={Chen, Xinlei and Shrivastava, Abhinav and Gupta, Abhinav},
  booktitle={ICCV},
  year={2013},
  url={http://xinleic.xyz/papers/iccv13.pdf}
}

HOG and Spatial Convolution on SIMD Architecture

Ishan Misra, Abhinav Shrivastava, Martial Hebert

CMU Technical Report 2013

pdf / code /

BibTeX

@article{misra2013hog,
  title={{HOG and Spatial Convolution on SIMD Architecture}},
  author={Misra, Ishan and Shrivastava, Abhinav and Hebert, Martial},
  journal={CMU Technical Report},
  year={2013},
  url={http://www.cs.cmu.edu/~imisra/projects/simd-hog-tech-report.pdf}
}

Measuring and Increasing the capacity of Natural HOG Statistics

Tinghui Zhou, Abhinav Shrivastava, Guillaume Obozinski, Abhinav Gupta, Alexei A. Efros

CMU Technical Report 2013

pdf /

BibTeX

@article{zhou2013measuring,
  title={{Measuring and Increasing the capacity of Natural HOG Statistics}},
  author={Zhou, Tinghui and Shrivastava, Abhinav and Obozinski, Guillaume and Gupta, Abhinav and Efros, Alexei A.},
  journal={CMU Technical Report},
  year={2013},
  url={https://arxiv.org/abs/1505.05232}
}

2012

Constrained Semi-Supervised Learning using Attributes and Comparative Attributes

Abhinav Shrivastava, Saurabh Singh, Abhinav Gupta

ECCV 2012 oral

pdf / webpage / video / slides /

BibTeX

@inproceedings{shrivastava2012constrained,
  title={{Constrained Semi-Supervised Learning using Attributes and Comparative Attributes}},
  author={Shrivastava, Abhinav and Singh, Saurabh and Gupta, Abhinav},
  booktitle={ECCV},
  year={2012},
  url={http://graphics.cs.cmu.edu/projects/constrainedSSL/SSL.pdf}
}

Exemplar-SVMs for Visual Object Detection, Label Transfer and Image Retrieval

Tomasz Malisiewicz, Abhinav Shrivastava, Abhinav Gupta, Alexei A. Efros

ICML 2012

pdf / slides /

BibTeX

@inproceedings{malisiewicz2012exemplarsvms,
  title={{Exemplar-SVMs for Visual Object Detection, Label Transfer and Image Retrieval}},
  author={Malisiewicz, Tomasz and Shrivastava, Abhinav and Gupta, Abhinav and Efros, Alexei A.},
  booktitle={ICML},
  year={2012},
  url={http://www.cs.cmu.edu/~tmalisie/projects/iccv11/malisiewicz_icml2012_abstract.pdf}
}

Real-time Household Object Detection from First-person's view using Exemplar-SVMs

Abhinav Shrivastava, Abhinav Gupta, Alexei A. Efros

Ego-Vision Workshop, CVPR 2012

webpage /

BibTeX

@inproceedings{shrivastava2012realtime,
  title={{Real-time Household Object Detection from First-person's view using Exemplar-SVMs}},
  author={Shrivastava, Abhinav and Gupta, Abhinav and Efros, Alexei A.},
  booktitle={Ego-Vision Workshop, CVPR},
  year={2012},
  url={https://www.cs.umd.edu/~abhinav/backup/googleAI/}
}

2011

Data-driven Visual Similarity for Cross-domain Image Matching

Abhinav Shrivastava, Tomasz Malisiewicz, Abhinav Gupta, Alexei A. Efros

SIGGRAPH Asia 2011 oral

pdf / webpage / code / video / slides / data / supplement /

BibTeX

@inproceedings{shrivastava2011datadriven,
  title={{Data-driven Visual Similarity for Cross-domain Image Matching}},
  author={Shrivastava, Abhinav and Malisiewicz, Tomasz and Gupta, Abhinav and Efros, Alexei A.},
  booktitle={SIGGRAPH Asia},
  year={2011},
  url={http://graphics.cs.cmu.edu/projects/crossDomainMatching/abhinav-sa11.pdf}
}

Patents

Action localization in images and videos using relational features

C. Sun, A. Shrivastava, C. L. Schmid, R. Sukthankar, K. P. Murphy, C. M. Vondrick

US 11163989 · Google Inc.

Visual Tracking by Colorization

A. Shrivastava, A. Fathi, S. G. Cotado, K. P. Murphy, C. M. Vondrick

US20210089777A1 · Google Inc.

Learning Compressible Features

A. Shrivastava, S. Singh, J. Balle, S. A. Haija, N. Johnston, G. Toderici

US20200311548A1 · Google Inc.

Compression of Machine-Learned Models via Entropy Penalized Weight Reparameterization

D. Oktay, S. Singh, J. Balle, A. Shrivastava

US20200364603A1 · Google Inc.

Determining documents that match a query

S. Mehrotra, J. Li, A. Shrivastava

US9442929B2 · Microsoft Technology Licensing LLC