Publications

2025

Panoptic Captioning: Seeking An Equivalency Bridge for Image and Text
Kun-Yu Lin, Hongjun Wang, Weining Ren, Kai Han
NeurIPS 2025

[BibTeX]
@inproceedings{Lin2025PanCap,
  author    = {Lin, Kun-Yu and Wang, Hongjun and Ren, Weining and Han, Kai},
  title     = {Panoptic Captioning: Seeking An Equivalency Bridge for Image and Text},
  booktitle = {Conference on Neural Information Processing Systems (NeurIPS)},
  year      = {2025},
}
Fin3R: Fine-Tuning Feed-Forward 3D Reconstruction Models via Monocular Knowledge Distillation
Weining Ren, Hongjun Wang, Xiao Tan, Kai Han
NeurIPS 2025

[BibTeX]
@inproceedings{Ren2025Fin3R,
  author    = {Ren, Weining and Wang, Hongjun and Tan, Xiao and Han, Kai},
  title     = {Fin3R: Fine-Tuning Feed-Forward 3D Reconstruction Models via Monocular Knowledge Distillation},
  booktitle = {Conference on Neural Information Processing Systems (NeurIPS)},
  year      = {2025},
}
Wukong's 72 Transformations: High-fidelity 3D Morphing via Flow Models
Minghao Yin, Yukang Cao, Kai Han
NeurIPS 2025

[BibTeX]
@inproceedings{Yin2025Wukong,
  author    = {Yin, Minghao and Cao, Yukang and Han, Kai},
  title     = {Wukong's 72 Transformations: High-fidelity 3D Morphing via Flow Models},
  booktitle = {Conference on Neural Information Processing Systems (NeurIPS)},
  year      = {2025},
}
3DRS: MLLMs Need 3D-Aware Representation Supervision for Scene Understanding
Xiaohu Huang, Jingjing Wu, Qunyi Xie, Kai Han
NeurIPS 2025

[BibTeX]
@inproceedings{Huang2025_3DRS,
  author    = {Huang, Xiaohu and Wu, Jingjing and Xie, Qunyi and Han, Kai},
  title     = {3DRS: MLLMs Need 3D-Aware Representation Supervision for Scene Understanding},
  booktitle = {Conference on Neural Information Processing Systems (NeurIPS)},
  year      = {2025},
}
VaMP: Variational Multi-Modal Prompt Learning for Vision-Language Models
Silin Cheng, Kai Han
NeurIPS 2025

[BibTeX]
@inproceedings{Cheng2025VaMP,
  author    = {Cheng, Silin and Han, Kai},
  title     = {VaMP: Variational Multi-Modal Prompt Learning for Vision-Language Models},
  booktitle = {Conference on Neural Information Processing Systems (NeurIPS)},
  year      = {2025},
}
SEAL: Semantic-Aware Hierarchical Learning for Generalized Category Discovery
Zhenqi He*, Yuanpei Liu*, Kai Han
NeurIPS 2025

[BibTeX]
@inproceedings{He2025SEAL,
  author    = {He, Zhenqi and Liu, Yuanpei and Han, Kai},
  title     = {SEAL: Semantic-Aware Hierarchical Learning for Generalized Category Discovery},
  booktitle = {Conference on Neural Information Processing Systems (NeurIPS)},
  year      = {2025},
}
GSPN-2: Efficient Parallel Sequence Modeling
Hongjun Wang, Yitong Jiang, Collin McCarthy, David Wehr, Hanrong Ye, Xinhao Li, Ka Chun Cheung, Wonmin Byeon, Jinwei Gu, Ke Chen, Kai Han, Hongxu Yin, Pavlo Molchanov, Jan Kautz, Sifei Liu
NeurIPS 2025

[BibTeX]
@inproceedings{Wang2025GSPN2,
  author    = {Wang, Hongjun and Jiang, Yitong and McCarthy, Collin and Wehr, David and Ye, Hanrong and Li, Xinhao and Cheung, Ka Chun and Byeon, Wonmin and Gu, Jinwei and Chen, Ke and Han, Kai and Yin, Hongxu and Molchanov, Pavlo and Kautz, Jan and Liu, Sifei},
  title     = {GSPN-2: Efficient Parallel Sequence Modeling},
  booktitle = {Conference on Neural Information Processing Systems (NeurIPS)},
  year      = {2025},
}
Inpaint4Drag: Repurposing Inpainting Models for Drag-Based Image Editing via Bidirectional Warping
Jingyi Lu, Kai Han
ICCV 2025

[BibTeX]
@inproceedings{Lu2025Inpaint4Drag,
  author    = {Lu, Jingyi and Han, Kai},
  title     = {Inpaint4Drag: Repurposing Inpainting Models for Drag-Based Image Editing via Bidirectional Warping},
  booktitle = {International Conference on Computer Vision (ICCV)},
  year      = {2025},
}
GRAB: A Challenging GRaph Analysis Benchmark for Large Multimodal Models
Jonathan Roberts, Kai Han, Samuel Albanie
ICCV 2025

[BibTeX]
@inproceedings{Roberts2025GRAB,
  author    = {Roberts, Jonathan and Han, Kai and Albanie, Samuel},
  title     = {GRAB: A Challenging GRaph Analysis Benchmark for Large Multimodal Models},
  booktitle = {International Conference on Computer Vision (ICCV)},
  year      = {2025},
}
GAMEBot: Transparent Assessment of LLM Reasoning in Games
Wenye Lin, Jonathan Roberts, Yunhan Yang, Samuel Albanie, Zongqing Lu, Kai Han
ACL 2025

[BibTeX]
@inproceedings{Lin2025GAMEBot,
  author    = {Lin, Wenye and Roberts, Jonathan and Yang, Yunhan and Albanie, Samuel and Lu, Zongqing and Han, Kai},
  title     = {GAMEBot: Transparent Assessment of LLM Reasoning in Games},
  booktitle = {Annual Meeting of the Association for Computational Linguistics (ACL)},
  year      = {2025},
}
PruneVid: Visual Token Pruning for Efficient Video Large Language Models
Xiaohu Huang, Hao Zhou, Kai Han
ACL 2025

[BibTeX]
@inproceedings{Cai2025PruneVid,
  author    = {Huang, Xiaohu and Zhou, Hao and Han, Kai},
  title     = {PruneVid: Visual Token Pruning for Efficient Video Large Language Models},
  booktitle = {Annual Meeting of the Association for Computational Linguistics (ACL)},
  year      = {2025},
}
Semantic Correspondence: Unified Benchmarking and a Strong Baseline
Kaiyan Zhang, Xinghui Li, Jingyi Lu, Kai Han
TPAMI 2025

[BibTeX]
@article{Zhang2025Semantic,
  title   = {Semantic Correspondence: Unified Benchmarking and a Strong Baseline},
  author  = {Zhang, Kaiyan and Li, Xinghui and Lu, Jingyi and Han, Kai},
  journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence (TPAMI)},
  year    = {2025},
}
Splat4D: Diffusion-Enhanced 4D Gaussian Splatting for Temporally and Spatially Consistent Content Creation
Minghao Yin, Yukang Cao, Songyou Peng, Kai Han
SIGGRAPH 2025

[BibTeX]
@inproceedings{Yin2025Splat4D,
  author    = {Yin, Minghao and Cao, Yukang and Peng, Songyou and Han, Kai},
  title     = {Splat4D: Diffusion-Enhanced 4D Gaussian Splatting for Temporally and Spatially Consistent Content Creation},
  booktitle = {SIGGRAPH},
  year      = {2025},
}
ICE: Intrinsic Concept Extraction from a Single Image via Diffusion Models
Fernando Julio Cendra, Kai Han
CVPR 2025 Highlight presentation (2.8% of submissions)

[BibTeX]
@inproceedings{Cendra2025ICE,
  author    = {Cendra, Fernando Julio and Han, Kai},
  title     = {ICE: Intrinsic Concept Extraction from a Single Image via Diffusion Models},
  booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
  year      = {2025},
}
Hyperbolic Category Discovery
Yuanpei Liu*, Zhenqi He*, Kai Han
CVPR 2025

[BibTeX]
@inproceedings{Liu2025HypCD,
  author    = {Liu, Yuanpei and He, Zhenqi and Han, Kai},
  title     = {Hyperbolic Category Discovery},
  booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
  year      = {2025},
}
Mr. DETR: Instructive Multi-Route Training for Detection Transformers
Chang-Bin Zhang, Yujie Zhong, Kai Han
CVPR 2025

[BibTeX]
@inproceedings{Zhang2025MrDETR,
  author    = {Zhang, Chang-Bin and Zhong, Yujie and Han, Kai},
  title     = {Mr. DETR: Instructive Multi-Route Training for Detection Transformers},
  booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
  year      = {2025},
}
v-CLR: View-Consistent Learning for Open-World Instance Segmentation
Chang-Bin Zhang, Jinhong Ni, Yujie Zhong, Kai Han
CVPR 2025 Highlight presentation (2.8% of submissions)

[BibTeX]
@inproceedings{Zhang2025vCLR,
  author    = {Zhang, Chang-Bin and Ni, Jinhong and Zhong, Yujie and Han, Kai},
  title     = {v-CLR: View-Consistent Learning for Open-World Instance Segmentation},
  booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
  year      = {2025},
}
Parallel Sequence Modeling via Generalized Spatial Propagation Network
Hongjun Wang, Wonmin Byeon, Jiarui Xu, Jinwei Gu, Ka Chun Cheung, Xiaolong Wang, Kai Han†, Jan Kautz, Sifei Liu
CVPR 2025

[BibTeX]
@inproceedings{Wang2025GSPN,
  author    = {Wang, Hongjun and Byeon, Wonmin and Xu, Jiarui and Gu, Jinwei and Cheung, Ka Chun and Wang, Xiaolong and Han, Kai and Kautz, Jan and Liu, Sifei},
  title     = {Parallel Sequence Modeling via Generalized Spatial Propagation Network},
  booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
  year      = {2025},
}
Detecting Open World Objects via Partial Attribute Assignment
Muli Yang, Gabriel James Goenawan, Huaiyuan Qin, Kai Han, Xi Peng, Yanhua Yang, Hongyuan Zhu
CVPR 2025

[BibTeX]
@inproceedings{Yang2025PASS,
  author    = {Yang, Muli and Goenawan, Gabriel James and Qin, Huaiyuan and Han, Kai and Peng, Xi and Yang, Yanhua and Zhu, Hongyuan},
  title     = {Detecting Open World Objects via Partial Attribute Assignment},
  booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
  year      = {2025},
}
DebGCD: Debiased Learning with Distribution Guidance for Generalized Category Discovery
Yuanpei Liu, Kai Han
ICLR 2025

[BibTeX]
@inproceedings{Liu2025DebGCD,
  author    = {Liu, Yuanpei and Han, Kai},
  title     = {DebGCD: Debiased Learning with Distribution Guidance for Generalized Category Discovery},
  booktitle = {International Conference on Learning Representations (ICLR)},
  year      = {2025},
}
HiLo: A Learning Framework for Generalized Category Discovery Robust to Domain Shifts
Hongjun Wang, Sagar Vaze, Kai Han
ICLR 2025

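[BibTeX]
@inproceedings{Wang2025HiLo,
 author    = {Hongjun Wang and Sagar Vaze and Kai Han},
 title     = {HiLo: A Learning Framework for Generalized Category Discovery Robust to Domain Shifts},
 booktitle = {International Conference on Learning Representations (ICLR)},
 year      = {2025},
}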
Needle Threading: Can LLMs Follow Threads Through Near-Million-Scale Haystacks?
Jonathan Roberts, Kai Han, Samuel Albanie
ICLR 2025

[BibTeX]
@inproceedings{Roberts2025Needle,
  author    = {Roberts, Jonathan and Han, Kai and Albanie, Samuel},
  title     = {Needle Threading: Can LLMs Follow Threads Through Near-Million-Scale Haystacks?},
  booktitle = {International Conference on Learning Representations (ICLR)},
  year      = {2025},
}
BiGR: Harnessing Binary Latent Codes for Image Generation and Improved Visual Representation Capabilities
Shaozhe Hao, Xuantong Liu, Xianbiao Qi, Shihao Zhao, Bojia Zi, Rong Xiao, Kai Han†, Kwan-Yee K. Wong
ICLR 2025

[BibTeX]
@inproceedings{Hao2025BiGR,
  author    = {Hao, Shaozhe and Liu, Xuantong and Qi, Xianbiao and Zhao, Shihao and Zi, Bojia and Xiao, Rong and Han, Kai and Wong, Kwan-Yee~K.},
  title     = {Bi{GR}: Harnessing Binary Latent Codes for Image Generation and Improved Visual Representation Capabilities},
  booktitle = {International Conference on Learning Representations (ICLR)},
  year      = {2025},
}
AvatarGO: Zero-shot 4D Human-Object Interaction Generation and Animation
Yukang Cao, Liang Pan, Kai Han, Kwan-Yee K. Wong, Ziwei Liu
ICLR 2025

[BibTeX]
@inproceedings{cao2024avatargo,
  author    = {Cao, Yukang and Pan, Liang and Han, Kai and Wong, Kwan-Yee~K. and Liu, Ziwei},
  title     = {AvatarGO: Zero-shot 4D Human-Object Interaction Generation and Animation},
  booktitle = {International Conference on Learning Representations (ICLR)},
  year      = {2025},
}
VipDiff: Towards Coherent and Diverse Video Inpainting via Training-free Denoising Diffusion Models
Chaohao Xie, Kai Han, Kwan-Yee K. Wong
WACV 2025

[BibTeX]
@inproceedings{Xie2025VipDiff,
  author    = {Xie, Chaohao and Han, Kai and Wong, Kwan-Yee K.},
  title     = {VipDiff: Towards Coherent and Diverse Video Inpainting via Training-free Denoising Diffusion Models},
  booktitle = {IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  year      = {2025},
}
CusConcept: Customized Visual Concept Decomposition with Diffusion Models
Zhi Xu, Shaozhe Hao, Kai Han
WACV 2025

[BibTeX]
@inproceedings{Xu2025CusConcept,
  author    = {Xu, Zhi and Hao, Shaozhe and Han, Kai},
  title     = {CusConcept: Customized Visual Concept Decomposition with Diffusion Models},
  booktitle = {IEEE/CVF Winter Conference on Applications of Computer Vision (WACV)},
  year      = {2025},
}

2024

SciFIBench: Benchmarking Large Multimodal Models for Scientific Figure Interpretation
Jonathan Roberts, Kai Han, Neil Houlsby, Samuel Albanie
NeurIPS 2024

[BibTeX]
@inproceedings{Roberts2024SciFIBench,
  author    = {Roberts, Jonathan and Han, Kai and Houlsby, Neil and Albanie, Samuel},
  title     = {SciFIBench: Benchmarking Large Multimodal Models for Scientific Figure Interpretation},
  booktitle = {Conference on Neural Information Processing Systems (NeurIPS)},
  year      = {2024},
}
Dissecting Out-of-Distribution Detection and Open-Set Recognition: A Critical Analysis of Methods and Benchmarks
Hongjun Wang, Sagar Vaze, Kai Han
IJCV 2024

[BibTeX]
@article{wang2024dissect,
  title   = {Dissecting Out-of-Distribution Detection and Open-Set Recognition: A Critical Analysis of Methods and Benchmarks},
  author  = {Wang, Hongjun and Vaze, Sagar and Han, Kai},
  journal = {International Journal of Computer Vision (IJCV)},
  year    = {2024},
}
RegionDrag: Fast Region-Based Image Editing with Diffusion Models
Jingyi Lu, Xinghui Li, Kai Han
ECCV 2024

[BibTeX]
@inproceedings{lu2024regiondrag,
  author    = {Lu, Jingyi and Li, Xinghui and Han, Kai},
  title     = {RegionDrag: Fast Region-Based Image Editing with Diffusion Models},
  booktitle = {European Conference on Computer Vision (ECCV)},
  year      = {2024},
}
PromptCCD: Learning Gaussian Mixture Prompt Pool for Continual Category Discovery
Fernando Julio Cendra, Bingchen Zhao, Kai Han
ECCV 2024

[BibTeX]
@inproceedings{cendra2024promptccd,
  author    = {Cendra, Fernando Julio and Zhao, Bingchen and Han, Kai},
  title     = {PromptCCD: Learning Gaussian Mixture Prompt Pool for Continual Category Discovery},
  booktitle = {European Conference on Computer Vision (ECCV)},
  year      = {2024},
}
ConceptExpress: Harnessing Diffusion Models for Single-image Unsupervised Concept Extraction
Shaozhe Hao, Kai Han, Zhengyao Lv, Shihao Zhao, Kwan-Yee K. Wong
ECCV 2024 (Oral presentation)

[BibTeX]
@inproceedings{hao2024conceptexpress,
  author    = {Hao, Shaozhe and Han, Kai and Lv, Zhengyao and Zhao, Shihao and Wong, Kwan-Yee~K.},
  title     = {{ConceptExpress}: Harnessing Diffusion Models for Single-image Unsupervised Concept Extraction},
  booktitle = {European Conference on Computer Vision (ECCV)},
  year      = {2024},
}
IBD-SLAM: Learning Image-Based Depth Fusion for Generalizable SLAM
Minghao Yin, Shangzhe Wu, Kai Han
CVPR 2024

[BibTeX]
@inproceedings{yin2024ibdslam,
  author    = {Yin, Minghao and Wu, Shangzhe and Han, Kai},
  title     = {IBD-SLAM: Learning Image-Based Depth Fusion for Generalizable SLAM},
  booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
  year      = {2024},
}
SD4Match: Learning to Prompt Stable Diffusion Model for Semantic Matching
Xinghui Li, Jingyi Lu, Kai Han†, Victor Prisacariu
CVPR 2024

[BibTeX]
@inproceedings{li2024sd4match,
  author    = {Li, Xinghui and Lu, Jingyi and Han, Kai and Prisacariu, Victor},
  title     = {SD4Match: Learning to Prompt Stable Diffusion Model for Semantic Matching},
  booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
  year      = {2024},
}
DreamAvatar: Text-and-Shape Guided 3D Human Avatar Generation via Diffusion Models
Yukang Cao*, Yan-Pei Cao*, Kai Han, Ying Shan, Kwan-Yee K. Wong
CVPR 2024

[BibTeX]
@inproceedings{cao23dream,
  author    = {Cao, Yukang and Cao, Yan-Pei and Han, Kai and Shan, Ying and Wong, Kwan-Yee K.},
  title     = {DreamAvatar: Text-and-Shape Guided 3D Human Avatar Generation via Diffusion Models},
  booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
  year      = {2024},
}
CiPR: An Efficient Framework with Cross-instance Positive Relations for Generalized Category Discovery
Shaozhe Hao, Kai Han, Kwan-Yee K. Wong
TMLR 2024

[BibTeX]
@article{hao23cipr,
  author  = {Hao, Shaozhe and Han, Kai and Wong, Kwan-Yee K.},
  title   = {CiPR: An Efficient Framework with Cross-instance Positive Relations for Generalized Category Discovery},
  journal = {Transactions on Machine Learning Research (TMLR)},
  year    = {2024},
}
SPTNet: An Efficient Alternative Framework for Generalized Category Discovery with Spatial Prompt Tuning
Hongjun Wang, Sagar Vaze, Kai Han
ICLR 2024

[BibTeX]
@inproceedings{wang2024sptnet,
  author    = {Wang, Hongjun and Vaze, Sagar and Han, Kai},
  title     = {SPTNet: An Efficient Alternative Framework for Generalized Category Discovery with Spatial Prompt Tuning},
  booktitle = {International Conference on Learning Representations (ICLR)},
  year      = {2024},
}
FROSTER: Frozen CLIP is a Strong Teacher for Open-Vocabulary Action Recognition
Xiaohu Huang, Hao Zhou, Kun Yao, Kai Han
ICLR 2024

[BibTeX]
@inproceedings{huang2024froster,
  author    = {Huang, Xiaohu and Zhou, Hao and Yao, Kun and Han, Kai},
  title     = {FROSTER: Frozen CLIP is a Strong Teacher for Open-Vocabulary Action Recognition},
  booktitle = {International Conference on Learning Representations (ICLR)},
  year      = {2024},
}

2023

HeadSculpt: Crafting 3D Head Avatars with Text
Xiao Han*, Yukang Cao*, Kai Han, Xiatian Zhu, Jiankang Deng, Yi-Zhe Song, Tao Xiang, Kwan-Yee K. Wong
NeurIPS 2023

[BibTeX]
@inproceedings{han2023headsculpt,
  author    = {Han, Xiao and Cao, Yukang and Han, Kai and Zhu, Xiatian and Deng, Jiankang and Song, Yi-Zhe and Xiang, Tao and Wong, Kwan-Yee K.},
  title     = {HeadSculpt: Crafting 3D Head Avatars with Text},
  booktitle = {Conference on Neural Information Processing Systems (NeurIPS)},
  year      = {2023},
}
DualRC: A Dual-Resolution Learning Framework with Neighbourhood Consensus for Visual Correspondences
Xinghui Li, Kai Han, Shuda Li, Victor Prisacariu
TPAMI 2023

[BibTeX]
@article{li23dualrc,
  title   = {DualRC: A Dual-Resolution Learning Framework with Neighbourhood Consensus for Visual Correspondences},
  author  = {Li, Xinghui and Han, Kai and Li, Shuda and Prisacariu, Victor},
  journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence (TPAMI)},
  year    = {2023},
}
Learning Semi-supervised Gaussian Mixture Models for Generalized Category Discovery
Bingchen Zhao, Xin Wen, Kai Han
ICCV 2023

[BibTeX]
@inproceedings{zhao23learning,
  author    = {Zhao, Bingchen and Wen, Xin and Han, Kai},
  title     = {Learning Semi-supervised Gaussian Mixture Models for Generalized Category Discovery},
  booktitle = {International Conference on Computer Vision (ICCV)},
  year      = {2023},
}
Open-Vocabulary Semantic Segmentation with Decoupled One-Pass Network
Cong Han, Yujie Zhong, Dengjie Li, Kai Han, Lin Ma
ICCV 2023

[BibTeX]
@inproceedings{han23open,
  author    = {Han, Cong and Zhong, Yujie and Li, Dengjie and Han, Kai and Ma, Lin},
  title     = {Open-Vocabulary Semantic Segmentation with Decoupled One-Pass Network},
  booktitle = {International Conference on Computer Vision (ICCV)},
  year      = {2023},
}
Learning Attention as Disentangler for Compositional Zero-shot Learning
Shaozhe Hao, Kai Han, Kwan-Yee K. Wong
CVPR 2023

[BibTeX]
@inproceedings{hao2023ade,
  author    = {Hao, Shaozhe and Han, Kai and Wong, Kwan-Yee K.},
  title     = {Learning Attention as Disentangler for Compositional Zero-shot Learning},
  booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
  year      = {2023},
}
SeSDF: Self-evolved Signed Distance Field for Implicit 3D Clothed Human Reconstruction
Yukang Cao, Kai Han, Kwan-Yee K. Wong
CVPR 2023

[BibTeX]
@inproceedings{cao2023sesdf,
  author    = {Cao, Yukang and Han, Kai and Wong, Kwan-Yee K.},
  title     = {SeSDF: Self-evolved Signed Distance Field for Implicit 3D Clothed Human Reconstruction},
  booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
  year      = {2023},
}

2022

Novel Class Discovery without Forgetting
K J Joseph, Sujoy Paul, Gaurav Aggarwal, Soma Biswas, Piyush Rai, Kai Han, Vineeth N Balasubramanian
ECCV 2022

[BibTeX]
@inproceedings{joseph22ncdwf,
  author    = {Joseph, K J and Paul, Sujoy and Aggarwal, Gaurav and Biswas, Soma and Rai, Piyush and Han, Kai and Balasubramanian, Vineeth N},
  title     = {Novel Class Discovery without Forgetting},
  booktitle = {European Conference on Computer Vision (ECCV)},
  year      = {2022},
}
Generalized Category Discovery
Sagar Vaze, Kai Han, Andrea Vedaldi, Andrew Zisserman
CVPR 2022

[BibTeX]
@inproceedings{vaze22generalized,
  author    = {Vaze, Sagar and Han, Kai and Vedaldi, Andrea and Zisserman, Andrew},
  title     = {Generalized Category Discovery},
  booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
  year      = {2022},
}
JIFF: Jointly-aligned Implicit Face Function for High Quality Single View Clothed Human Reconstruction
Yukang Cao, Guanying Chen, Kai Han, Wenqi Yang, Kwan-Yee K. Wong
CVPR 2022 (Oral presentation)

[BibTeX]
@inproceedings{cao22jiff,
  author    = {Cao, Yukang and Chen, Guanying and Han, Kai and Yang, Wenqi and Wong, Kwan-Yee K.},
  title     = {JIFF: Jointly-aligned Implicit Face Function for High Quality Single View Clothed Human Reconstruction},
  booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
  year      = {2022},
}
SharpContour: A Contour-based Boundary Refinement Approach for Efficient and Accurate Instance Segmentation
Chenming Zhu, Xuanye Zhang, Yanran Li, Liangdong Qiu, Kai Han, Xiaoguang Han
CVPR 2022

[BibTeX]
@inproceedings{zhu22sharpcontour,
  author    = {Zhu, Chenming and Zhang, Xuanye and Li, Yanran and Qiu, Liangdong and Han, Kai and Han, Xiaoguang},
  title     = {SharpContour: A Contour-based Boundary Refinement Approach for Efficient and Accurate Instance Segmentation},
  booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
  year      = {2022},
}
Spacing Loss for Discovering Novel Categories
K J Joseph, Sujoy Paul, Gaurav Aggarwal, Soma Biswas, Piyush Rai, Kai Han, Vineeth N Balasubramanian
CVPRW 2022 (Best Paper Runner-Up Award)

[BibTeX]
@inproceedings{joseph22spacing,
  author    = {Joseph, K J and Paul, Sujoy and Aggarwal, Gaurav and Biswas, Soma and Rai, Piyush and Han, Kai and Balasubramanian, Vineeth N},
  title     = {Spacing Loss for Discovering Novel Categories},
  booktitle = {CVPR Workshop on Continual Learning in Computer Vision},
  year      = {2022},
}
Open-Set Recognition: A Good Closed-Set Classifier is All You Need?
Sagar Vaze, Kai Han, Andrea Vedaldi, Andrew Zisserman
ICLR 2022 (Oral presentation)

[BibTeX]
@inproceedings{vaze22openset,
  author    = {Vaze, Sagar and Han, Kai and Vedaldi, Andrea and Zisserman, Andrew},
  title     = {Open-Set Recognition: A Good Closed-Set Classifier is All You Need?},
  booktitle = {International Conference on Learning Representations (ICLR)},
  year      = {2022},
}

2021

Novel Visual Category Discovery with Dual Ranking Statistics and Mutual Knowledge Distillation
Bingchen Zhao, Kai Han
NeurIPS 2021

[BibTeX]
@inproceedings{zhao21novel,
  author    = {Zhao, Bingchen and Han, Kai},
  title     = {Novel Visual Category Discovery with Dual Ranking Statistics and Mutual Knowledge Distillation},
  booktitle = {Conference on Neural Information Processing Systems (NeurIPS)},
  year      = {2021},
}
Joint Representation Learning and Novel Category Discovery on Single- and Multi-modal Data
Xuhui Jia, Kai Han, Yukun Zhu, Bradley Green
ICCV 2021

[BibTeX]
@inproceedings{jia21joint,
  author    = {Jia, Xuhui and Han, Kai and Zhu, Yukun and Green, Bradley},
  title     = {Joint Representation Learning and Novel Category Discovery on Single- and Multi-modal Data},
  booktitle = {International Conference on Computer Vision (ICCV)},
  year      = {2021},
}
XResolution Correspondence Networks
Georgi Tinchev, Shuda Li, Kai Han, David Mitchell, Rigas Kouskouridas
BMVC 2021

[BibTeX]
@inproceedings{tinchev20xresolution,
  author    = {Tinchev, Georgi and Li, Shuda and Han, Kai and Mitchell, David and Kouskouridas, Rigas},
  title     = {{$\mathbb{X}$}Resolution Correspondence Networks},
  booktitle = {British Machine Vision Conference (BMVC)},
  year      = {2021},
}
LSD-C: Linearly Separable Deep Clusters
Sylvestre-Alvise Rebuffi*, Sebastien Ehrhardt*, Kai Han*, Andrea Vedaldi, Andrew Zisserman
ICCVW 2021

[BibTeX]
@inproceedings{rebuffi21lsdc,
  author    = {Rebuffi, Sylvestre-Alvise and Ehrhardt, Sebastien and Han, Kai and Vedaldi, Andrea and Zisserman, Andrew},
  title     = {LSD-C: Linearly Separable Deep Clusters},
  booktitle = {ICCV Workshop on Visual Inductive Priors for Data-Efficient Deep Learning},
  year      = {2021},
}
Contrastive Learning based Hybrid Networks for Long-Tailed Image Classification
Peng Wang, Kai Han, Xiu-Shen Wei, Lei Zhang, Lei Wang
CVPR 2021

[BibTeX]
@inproceedings{wang21contrastive,
  author    = {Wang, Peng and Han, Kai and Wei, Xiu-Shen and Zhang, Lei and Wang, Lei},
  title     = {Contrastive Learning based Hybrid Networks for Long-Tailed Image Classification},
  booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
  year      = {2021},
}
AutoNovel: Automatically Discovering and Learning Novel Visual Categories
Kai Han, Sylvestre-Alvise Rebuffi, Sebastien Ehrhardt, Andrea Vedaldi, Andrew Zisserman
TPAMI 2021

[BibTeX]
@article{han21autonovel,
  title   = {AutoNovel: Automatically Discovering and Learning Novel Visual Categories},
  author  = {Han, Kai and Rebuffi, Sylvestre-Alvise and Ehrhardt, Sebastien and Vedaldi, Andrea and Zisserman, Andrew},
  journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence (TPAMI)},
  year    = {2021},
}
Anisotropic Convolutional Neural Networks for RGB-D based Semantic Scene Completion
Jie Li, Peng Wang, Kai Han, Yu Liu
TPAMI 2021

[BibTeX]
@article{li21anisotropic,
  title   = {Anisotropic Convolutional Neural Networks for RGB-D based Semantic Scene Completion},
  author  = {Li, Jie and Wang, Peng and Han, Kai and Liu, Yu},
  journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence (TPAMI)},
  year    = {2021},
}
Fixed Viewpoint Mirror Surface Reconstruction under an Uncalibrated Camera
Kai Han, Miaomiao Liu, Dirk Schnieders, Kwan-Yee K. Wong
TIP 2021

[BibTeX]
@article{han21fixed,
  author  = {Han, Kai and Liu, Miaomiao and Schnieders, Dirk and Wong, Kwan-Yee K.},
  title   = {Fixed Viewpoint Mirror Surface Reconstruction under an Uncalibrated Camera},
  journal = {IEEE Transactions on Image Processing (TIP)},
  year    = {2021},
}

2020

Dual-Resolution Correspondence Networks
Xinghui Li, Kai Han, Shuda Li, Victor Prisacariu
NeurIPS 2020

[BibTeX]
@inproceedings{li20dualrc,
  author    = {Li, Xinghui and Han, Kai and Li, Shuda and Prisacariu, Victor},
  title     = {Dual-Resolution Correspondence Networks},
  booktitle = {Conference on Neural Information Processing Systems (NeurIPS)},
  year      = {2020},
}
Automatically Discovering and Learning New Visual Categories with Ranking Statistics
Kai Han*, Sylvestre-Alvise Rebuffi*, Sebastien Ehrhardt*, Andrea Vedaldi, Andrew Zisserman
ICLR 2020

[BibTeX]
@inproceedings{han20automatically,
  author    = {Han, Kai and Rebuffi, Sylvestre-Alvise and Ehrhardt, Sebastien and Vedaldi, Andrea and Zisserman, Andrew},
  title     = {Automatically Discovering and Learning New Visual Categories with Ranking Statistics},
  booktitle = {International Conference on Learning Representations (ICLR)},
  year      = {2020},
}
Correspondence Networks with Adaptive Neighbourhood Consensus
Shuda Li*, Kai Han*, Theo W. Costain, Henry Howard-Jenkins, Victor Prisacariu
CVPR 2020

[BibTeX]
@inproceedings{li20correspondence,
  author    = {Li, Shuda and Han, Kai and Costain, Theo W. and Howard-Jenkins, Henry and Prisacariu, Victor},
  title     = {Correspondence Networks with Adaptive Neighbourhood Consensus},
  booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
  year      = {2020},
}
Anisotropic Convolutional Networks for 3D Semantic Scene Completion
Jie Li, Kai Han, Peng Wang, Yu Liu, Xia Yuan
CVPR 2020

[BibTeX]
@inproceedings{li20anisotropic,
  author    = {Li, Jie and Han, Kai and Wang, Peng and Liu, Yu and Yuan, Xia},
  title     = {Anisotropic Convolutional Networks for 3D Semantic Scene Completion},
  booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
  year      = {2020},
}
Semi-Supervised Learning with Scarce Annotations
Sylvestre-Alvise Rebuffi*, Sebastien Ehrhardt*, Kai Han*, Andrea Vedaldi, Andrew Zisserman
CVPRW 2020

[BibTeX]
@inproceedings{rebuffi20SSL,
  author    = {Rebuffi, Sylvestre-Alvise and Ehrhardt, Sebastien and Han, Kai and Vedaldi, Andrea and Zisserman, Andrew},
  title     = {Semi-Supervised Learning with Scarce Annotations},
  booktitle = {CVPR Deep Vision Workshop},
  year      = {2020},
}
Deep Photometric Stereo for Non-Lambertian Surfaces
Guanying Chen, Kai Han, Boxin Shi, Yasuyuki Matsushita, Kwan-Yee K. Wong
TPAMI 2020

[BibTeX]
@article{chen20deepps,
  author  = {Chen, Guanying and Han, Kai and Shi, Boxin and Matsushita, Yasuyuki and Wong, Kwan-Yee K.},
  title   = {Deep Photometric Stereo for Non-Lambertian Surfaces},
  journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence (TPAMI)},
  year    = {2020},
}

2019

Learning to Discover Novel Visual Categories via Deep Transfer Clustering
Kai Han, Andrea Vedaldi, Andrew Zisserman
ICCV 2019

[BibTeX]
@inproceedings{han19DTC,
  author    = {Han, Kai and Vedaldi, Andrea and Zisserman, Andrew},
  title     = {Learning to Discover Novel Visual Categories via Deep Transfer Clustering},
  booktitle = {International Conference on Computer Vision (ICCV)},
  year      = {2019},
}
Unsupervised Image Matching and Object Discovery as Optimization
Huy V. Vo, Francis Bach, Minsu Cho, Kai Han, Yann LeCun, Patrick Pérez, Jean Ponce
CVPR 2019

[BibTeX]
@inproceedings{vo19unsup,
  author    = {Vo, Huy V. and Bach, Francis and Cho, Minsu and Han, Kai and LeCun, Yann and P{\'e}rez, Patrick and Ponce, Jean},
  title     = {Unsupervised Image Matching and Object Discovery as Optimization},
  booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
  year      = {2019},
}
Self-calibrating Deep Photometric Stereo Networks
Guanying Chen, Kai Han, Boxin Shi, Yasuyuki Matsushita, Kwan-Yee K. Wong
CVPR 2019 (Oral presentation)

[BibTeX]
@inproceedings{chen19SDPS_Net,
  author    = {Chen, Guanying and Han, Kai and Shi, Boxin and Matsushita, Yasuyuki and Wong, Kwan-Yee K.},
  title     = {Self-calibrating Deep Photometric Stereo Networks},
  booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
  year      = {2019},
}
Learning Transparent Object Matting
Guanying Chen*, Kai Han*, Kwan-Yee K. Wong
IJCV 2019

[BibTeX]
@article{chen19LTOM,
  author  = {Chen, Guanying and Han, Kai and Wong, Kwan-Yee K.},
  title   = {Learning Transparent Object Matting},
  journal = {International Journal of Computer Vision (IJCV)},
  year    = {2019},
}

2018

PS-FCN: A Flexible Learning Framework for Photometric Stereo
Guanying Chen, Kai Han, Kwan-Yee K. Wong
ECCV 2018

[BibTeX]
@inproceedings{chen18ps_fcn,
  author    = {Chen, Guanying and Han, Kai and Wong, Kwan-Yee K.},
  title     = {PS-FCN: A Flexible Learning Framework for Photometric Stereo},
  booktitle = {European Conference on Computer Vision (ECCV)},
  year      = {2018},
}
TOM-Net: Learning Transparent Object Matting from a Single Image
Guanying Chen*, Kai Han*, Kwan-Yee K. Wong
CVPR 2018 (Spotlight presentation)

[BibTeX]
@inproceedings{chen18tom_net,
  author    = {Chen, Guanying and Han, Kai and Wong, Kwan-Yee K.},
  title     = {TOM-Net: Learning Transparent Object Matting from a Single Image},
  booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
  year      = {2018},
}
Dense Reconstruction of Transparent Objects by Altering Incident Light Paths Through Refraction
Kai Han, Kwan-Yee K. Wong, Miaomiao Liu
IJCV 2018

[BibTeX]
@article{han18dense,
  author  = {Han, Kai and Wong, Kwan-Yee K. and Liu, Miaomiao},
  title   = {Dense Reconstruction of Transparent Objects by Altering Incident Light Paths through Refraction},
  journal = {International Journal of Computer Vision (IJCV)},
  year    = {2018},
}

2017

SCNet: Learning Semantic Correspondence
Kai Han, Rafael S. Rezende, Bumsub Ham, Kwan-Yee K. Wong, Minsu Cho, Cordelia Schmid, Jean Ponce
ICCV 2017

[BibTeX]
@inproceedings{han17scnet,
  author    = {Han, Kai and Rezende, Rafael S. and Ham, Bumsub and Wong, Kwan-Yee K. and Cho, Minsu and Schmid, Cordelia and Ponce, Jean},
  title     = {SCNet: Learning Semantic Correspondence},
  booktitle = {International Conference on Computer Vision (ICCV)},
  year      = {2017},
}

2016

Single View 3D Reconstruction under an Uncalibrated Camera and an Unknown Mirror Sphere
Kai Han, Kwan-Yee K. Wong, Xiao Tan
3DV 2016

[BibTeX]
% 3DV 2016 conference paper.
% The token 3D in the title is brace-protected; without protection,
% sentence-casing bibliography styles render it as 3d.
@inproceedings{han16single,
  author    = {Kai Han and Kwan-Yee K. Wong and Xiao Tan},
  title     = {Single View {3D} Reconstruction under an Uncalibrated Camera and an Unknown Mirror Sphere},
  booktitle = {International Conference on 3D Vision (3DV)},
  year      = {2016},
}
Mirror Surface Reconstruction under an Uncalibrated Camera
Kai Han, Kwan-Yee K. Wong, Dirk Schnieders, Miaomiao Liu
CVPR 2016

[BibTeX]
% CVPR 2016 conference paper.
% Fields are listed in the order author, title, venue, year.
@inproceedings{han16mirror,
  author    = {Kai Han and Kwan-Yee K. Wong and Dirk Schnieders and Miaomiao Liu},
  title     = {Mirror Surface Reconstruction under an Uncalibrated Camera},
  booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
  year      = {2016},
}

2015

A Fixed Viewpoint Approach for Dense Reconstruction of Transparent Objects
Kai Han, Kwan-Yee K. Wong, Miaomiao Liu
CVPR 2015

[BibTeX]
% CVPR 2015 conference paper.
% Fields are listed in the order author, title, venue, year.
@inproceedings{han15afixed,
  author    = {Kai Han and Kwan-Yee K. Wong and Miaomiao Liu},
  title     = {A Fixed Viewpoint Approach for Dense Reconstruction of Transparent Objects},
  booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
  year      = {2015},
}

Preprints

PartCo: Part-Level Correspondence Priors Enhance Category Discovery
Fernando Julio Cendra, Kai Han
arXiv preprint, 2025

[BibTeX]
% arXiv preprint, 2025; the arXiv identifier is carried in the journal field.
% The method name PartCo is brace-protected so that bibliography styles
% which sentence-case titles do not render it as Partco.
@article{Cendra2025PartCo,
  author  = {Fernando Julio Cendra and Kai Han},
  title   = {{PartCo}: Part-Level Correspondence Priors Enhance Category Discovery},
  journal = {arXiv preprint arXiv:2509.22542},
  year    = {2025},
}
Category Discovery: An Open-World Perspective
Zhenqi He, Yuanpei Liu, Kai Han
arXiv preprint, 2025

[BibTeX]
% arXiv preprint, 2025; the arXiv identifier is carried in the journal field.
% Fields are listed in the order author, title, venue, year.
@article{He2025CategoryDiscovery,
  author  = {Zhenqi He and Yuanpei Liu and Kai Han},
  title   = {Category Discovery: An Open-World Perspective},
  journal = {arXiv preprint arXiv:2502.09696},
  year    = {2025},
}
ZeroBench: An Impossible Visual Benchmark for Contemporary Large Multimodal Models
Jonathan Roberts, Mohammad Reza Taesiri, Ansh Sharma, Akash Gupta, Kai Han, Samuel Albanie
arXiv preprint, 2025

[BibTeX]
% arXiv preprint, 2025; the arXiv identifier is carried in the journal field.
% The benchmark name ZeroBench is brace-protected so that bibliography
% styles which sentence-case titles do not render it as Zerobench.
@article{Roberts2025ZeroBench,
  author  = {Jonathan Roberts and Mohammad Reza Taesiri and Ansh Sharma and Akash Gupta and Kai Han and Samuel Albanie},
  title   = {{ZeroBench}: An Impossible Visual Benchmark for Contemporary Large Multimodal Models},
  journal = {arXiv preprint arXiv:2507.06261},
  year    = {2025},
}
ViCo: Detail-Preserving Visual Condition for Personalized Text-to-Image Generation
Shaozhe Hao, Kai Han†, Shihao Zhao, Kwan-Yee K. Wong
arXiv preprint, 2023

[BibTeX]
% arXiv preprint, 2023; the arXiv identifier is carried in the journal field.
% The method name ViCo is brace-protected so that bibliography styles
% which sentence-case titles do not render it as Vico.
@article{hao2023ViCo,
  author  = {Shaozhe Hao and Kai Han and Shihao Zhao and Kwan-Yee K. Wong},
  title   = {{ViCo}: Detail-Preserving Visual Condition for Personalized Text-to-Image Generation},
  journal = {arXiv preprint arXiv:2306.00971},
  year    = {2023},
}
GPT4GEO: How a Language Model Sees the World's Geography
Jonathan Roberts, Timo Lüddecke, Sowmen Das, Kai Han, Samuel Albanie
arXiv preprint, 2023

[BibTeX]
% arXiv preprint, 2023; the arXiv identifier is carried in the journal field.
% The name GPT4GEO is brace-protected so that bibliography styles which
% sentence-case titles do not render it as Gpt4geo.
% Authors are kept in the "Last, First" form, with the u-umlaut written as a
% LaTeX accent group.
@article{roberts2023gpt4geo,
  author  = {Roberts, Jonathan and L{\"u}ddecke, Timo and Das, Sowmen and Han, Kai and Albanie, Samuel},
  title   = {{GPT4GEO}: How a Language Model Sees the World's Geography},
  journal = {arXiv preprint arXiv:2306.00020},
  year    = {2023},
}
What’s in a Name? Beyond Class Indices for Image Recognition
Kai Han*, Yandong Li*, Sagar Vaze*, Jie Li, Xuhui Jia
arXiv preprint, 2023

[BibTeX]
% arXiv preprint, 2023; the arXiv identifier is carried in the journal field.
% The word Beyond is brace-protected: BibTeX sentence-casing preserves a
% capital only at the start of the title and after a colon, so the word
% following the question mark would otherwise be lowercased.
@article{han23scd,
  author  = {Kai Han and Yandong Li and Sagar Vaze and Jie Li and Xuhui Jia},
  title   = {What's in a Name? {Beyond} Class Indices for Image Recognition},
  journal = {arXiv preprint arXiv:2304.02364},
  year    = {2023},
}
HeadSculpt: Crafting 3D Head Avatars with Text
Xiao Han*, Yukang Cao*, Kai Han, Xiatian Zhu, Jiankang Deng, Yi-Zhe Song, Tao Xiang, Kwan-Yee K. Wong
arXiv preprint, 2023

[BibTeX]
% arXiv preprint, 2023; the arXiv identifier is carried in the journal field.
% The name HeadSculpt and the token 3D are brace-protected so that
% bibliography styles which sentence-case titles keep their capitalization.
@article{han2023headsculpt,
  author  = {Xiao Han and Yukang Cao and Kai Han and Xiatian Zhu and Jiankang Deng and Yi-Zhe Song and Tao Xiang and Kwan-Yee K. Wong},
  title   = {{HeadSculpt}: Crafting {3D} Head Avatars with Text},
  journal = {arXiv preprint arXiv:2306.03038},
  year    = {2023},
}
SimSC: A Simple Framework for Semantic Correspondence with Temperature Learning
Xinghui Li, Kai Han, Xingchen Wan, Victor Adrian Prisacariu
arXiv preprint, 2023

[BibTeX]
% arXiv preprint, 2023; the arXiv identifier is carried in the journal field.
% The method name SimSC is brace-protected so that bibliography styles
% which sentence-case titles do not render it as Simsc.
@article{li23SimSC,
  author  = {Xinghui Li and Kai Han and Xingchen Wan and Victor Adrian Prisacariu},
  title   = {{SimSC}: A Simple Framework for Semantic Correspondence with Temperature Learning},
  journal = {arXiv preprint arXiv:2305.02385},
  year    = {2023},
}
SATIN: A Multi-Task Metadataset for Classifying Satellite Imagery using Vision-Language Models
Jonathan Roberts, Kai Han, Samuel Albanie
arXiv preprint, 2023

[BibTeX]
% arXiv preprint, 2023; the arXiv identifier is carried in the journal field.
% The name SATIN is brace-protected so that bibliography styles which
% sentence-case titles do not render it as Satin.
@article{roberts2023satin,
  author  = {Jonathan Roberts and Kai Han and Samuel Albanie},
  title   = {{SATIN}: A Multi-Task Metadataset for Classifying Satellite Imagery using Vision-Language Models},
  journal = {arXiv preprint arXiv:2304.11619},
  year    = {2023},
}
Learning Inverse Rendering of Faces from Real-world Videos
Yuda Qiu*, Zhangyang Xiong*, Kai Han, Zhongyuan Wang, Zixiang Xiong, Xiaoguang Han
arXiv preprint, 2020

[BibTeX]
% arXiv preprint, 2020; the arXiv identifier is carried in the journal field.
% Fields are listed in the order author, title, venue, year.
@article{qiu20learning,
  author  = {Yuda Qiu and Zhangyang Xiong and Kai Han and Zhongyuan Wang and Zixiang Xiong and Xiaoguang Han},
  title   = {Learning Inverse Rendering of Faces from Real-world Videos},
  journal = {arXiv preprint arXiv:2003.12047},
  year    = {2020},
}