2024
ANAH: Analytical Annotation of Hallucinations in Large Language Models Ziwei Ji, Yuzhe Gu, Wenwei Zhang, and 3 more authors In Proceedings of the Annual Meeting of the Association for Computational Linguistics (ACL) 2024 Bib PDF Code Website
@inproceedings{ji2024anah,
  title     = {ANAH: Analytical Annotation of Hallucinations in Large Language Models},
  author    = {Ji, Ziwei and Gu, Yuzhe and Zhang, Wenwei and Lyu, Chengqi and Lin, Dahua and Chen, Kai},
  booktitle = {Proceedings of the Annual Meeting of the Association for Computational Linguistics (ACL)},
  year      = {2024},
}

T-Eval: Evaluating the Tool Utilization Capability of Large Language Models Step by Step Zehui Chen, Weihua Du, Wenwei Zhang, and 8 more authors In Proceedings of the Annual Meeting of the Association for Computational Linguistics (ACL) 2024 Bib PDF Code Website
@inproceedings{chen2024t,
  title     = {T-Eval: Evaluating the Tool Utilization Capability of Large Language Models Step by Step},
  author    = {Chen, Zehui and Du, Weihua and Zhang, Wenwei and Liu, Kuikun and Liu, Jiangning and Zheng, Miao and Zhuo, Jingming and Zhang, Songyang and Lin, Dahua and Chen, Kai and Zhao, Feng},
  booktitle = {Proceedings of the Annual Meeting of the Association for Computational Linguistics (ACL)},
  year      = {2024},
}

Agent-FLAN: Designing Data and Methods of Effective Agent Tuning for Large Language Models Zehui Chen, Kuikun Liu, Qiuchen Wang, and 5 more authors In Findings of the Association for Computational Linguistics: ACL 2024 Bib PDF Code
@inproceedings{chen2024agent,
  title     = {Agent-FLAN: Designing Data and Methods of Effective Agent Tuning for Large Language Models},
  author    = {Chen, Zehui and Liu, Kuikun and Wang, Qiuchen and Zhang, Wenwei and Liu, Jiangning and Lin, Dahua and Chen, Kai and Zhao, Feng},
  booktitle = {Findings of the Association for Computational Linguistics: ACL},
  year      = {2024},
}

LLaST: Improved End-to-end Speech Translation System Leveraged by Large Language Models Xi Chen, Songyang Zhang, Qibing
Bai, and 2 more authors In Findings of the Association for Computational Linguistics: ACL 2024 Bib
@inproceedings{chen2024llast,
  title     = {LLaST: Improved End-to-end Speech Translation System Leveraged by Large Language Models},
  author    = {Chen, Xi and Zhang, Songyang and Bai, Qibing and Chen, Kai and Nakamura, Satoshi},
  booktitle = {Findings of the Association for Computational Linguistics: ACL},
  year      = {2024},
}

MathBench: Evaluating the Theory and Application Proficiency of LLMs with a Hierarchical Mathematics Benchmark Hongwei Liu, Zilong Zheng, Yuxuan Qiao, and 7 more authors In Findings of the Association for Computational Linguistics: ACL 2024 Bib PDF Code
@inproceedings{liu2024mathbench,
  title     = {MathBench: Evaluating the Theory and Application Proficiency of LLMs with a Hierarchical Mathematics Benchmark},
  author    = {Liu, Hongwei and Zheng, Zilong and Qiao, Yuxuan and Duan, Haodong and Fei, Zhiwei and Zhou, Fengzhe and Zhang, Wenwei and Zhang, Songyang and Lin, Dahua and Chen, Kai},
  booktitle = {Findings of the Association for Computational Linguistics: ACL},
  year      = {2024},
}

Differential Model Scaling using Differential Topk Kai Liu, Ruohui Wang, Jianfei Gao, and 1 more author In International Conference on Machine Learning (ICML) 2024 Bib
@inproceedings{liu2024differential,
  title     = {Differential Model Scaling using Differential Topk},
  author    = {Liu, Kai and Wang, Ruohui and Gao, Jianfei and Chen, Kai},
  booktitle = {International Conference on Machine Learning (ICML)},
  year      = {2024},
}

Can AI Assistants Know What They Don’t Know?
Qinyuan Cheng, Tianxiang Sun, Xiangyang Liu, and 6 more authors In International Conference on Machine Learning (ICML) 2024 Bib PDF Code
@inproceedings{cheng2024can,
  title     = {Can AI Assistants Know What They Don't Know?},
  author    = {Cheng, Qinyuan and Sun, Tianxiang and Liu, Xiangyang and Zhang, Wenwei and Yin, Zhangyue and Li, Shimin and Li, Linyang and Chen, Kai and Qiu, Xipeng},
  booktitle = {International Conference on Machine Learning (ICML)},
  year      = {2024},
}

Ada-LEval: Evaluating long-context LLMs with length-adaptable benchmarks Chonghua Wang, Haodong Duan, Songyang Zhang, and 2 more authors In NAACL 2024 Bib PDF Code
% Venue is spelled out in full, following the "Full Name (ACRONYM)" pattern the other booktitle fields in this file use.
@inproceedings{wang2024ada,
  title     = {Ada-LEval: Evaluating long-context LLMs with length-adaptable benchmarks},
  author    = {Wang, Chonghua and Duan, Haodong and Zhang, Songyang and Lin, Dahua and Chen, Kai},
  booktitle = {Proceedings of the Conference of the North American Chapter of the Association for Computational Linguistics (NAACL)},
  year      = {2024},
}

BotChat: Evaluating LLMs’ Capabilities of Having Multi-Turn Dialogues Haodong Duan, Jueqi Wei, Chonghua Wang, and 5 more authors In NAACL findings 2024 Bib PDF Code
% Findings venue named the same way as the "Findings of the Association for Computational Linguistics: ACL" entries.
@inproceedings{duan2023botchat,
  title     = {BotChat: Evaluating LLMs' Capabilities of Having Multi-Turn Dialogues},
  author    = {Duan, Haodong and Wei, Jueqi and Wang, Chonghua and Liu, Hongwei and Fang, Yixiao and Zhang, Songyang and Lin, Dahua and Chen, Kai},
  booktitle = {Findings of the Association for Computational Linguistics: NAACL},
  year      = {2024},
}

PIA: Your Personalized Image Animator via Plug-and-Play Modules in Text-to-Image Models Yiming Zhang, Zhening Xing, Yanhong Zeng, and 2 more authors In Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR) 2024 Bib PDF Code Website
@inproceedings{zhang2024pia,
  title     = {PIA: Your Personalized Image Animator via Plug-and-Play Modules in Text-to-Image Models},
  author    = {Zhang, Yiming and Xing, Zhening and Zeng, Yanhong and Fang, Youqing and Chen, Kai},
  booktitle = {Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
  year      = {2024},
}

Make-It-Vivid: Dressing Your Animatable Biped Cartoon
Characters from Text Junshu Tang, Yanhong Zeng, Ke Fan, and 4 more authors In Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR) 2024 Bib PDF Code Website
@inproceedings{tang2024make,
  title     = {Make-It-Vivid: Dressing Your Animatable Biped Cartoon Characters from Text},
  author    = {Tang, Junshu and Zeng, Yanhong and Fan, Ke and Wang, Xuheng and Dai, Bo and Chen, Kai and Ma, Lizhuang},
  booktitle = {Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
  year      = {2024},
}

EmbodiedScan: A Holistic Multi-Modal 3D Perception Suite Towards Embodied AI Tai Wang, Xiaohan Mao, Chenming Zhu, and 11 more authors In Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR) 2024 Bib PDF Code Website
@inproceedings{wang2023embodiedscan,
  title     = {EmbodiedScan: A Holistic Multi-Modal 3D Perception Suite Towards Embodied AI},
  author    = {Wang, Tai and Mao, Xiaohan and Zhu, Chenming and Xu, Runsen and Lyu, Ruiyuan and Li, Peisen and Chen, Xiao and Zhang, Wenwei and Chen, Kai and Xue, Tianfan and Liu, Xihui and Lu, Cewu and Lin, Dahua and Pang, Jiangmiao},
  booktitle = {Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
  year      = {2024},
}

OMG-Seg: Is One Model Good Enough For All Segmentation?
Xiangtai Li, Haobo Yuan, Wei Li, and 6 more authors In Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR) 2024 Bib PDF Code Website
@inproceedings{li2024omg,
  title     = {OMG-Seg: Is One Model Good Enough For All Segmentation?},
  author    = {Li, Xiangtai and Yuan, Haobo and Li, Wei and Ding, Henghui and Wu, Size and Zhang, Wenwei and Li, Yining and Chen, Kai and Loy, Chen Change},
  booktitle = {Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
  year      = {2024},
}

Towards language-driven video inpainting via multimodal large language models Jianzong Wu, Xiangtai Li, Chenyang Si, and 8 more authors In Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR) 2024 Bib PDF Code Website
@inproceedings{wu2024towards,
  title     = {Towards language-driven video inpainting via multimodal large language models},
  author    = {Wu, Jianzong and Li, Xiangtai and Si, Chenyang and Zhou, Shangchen and Yang, Jingkang and Zhang, Jiangning and Li, Yining and Chen, Kai and Tong, Yunhai and Liu, Ziwei and Loy, Chen Change},
  booktitle = {Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
  year      = {2024},
}

From Pixels to Graphs: Open-Vocabulary Scene Graph Generation with Vision-Language Models Rongjie Li, Songyang Zhang, Dahua Lin, and 2 more authors In Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR) 2024 Bib PDF
@inproceedings{li2024pixels,
  title     = {From Pixels to Graphs: Open-Vocabulary Scene Graph Generation with Vision-Language Models},
  author    = {Li, Rongjie and Zhang, Songyang and Lin, Dahua and Chen, Kai and He, Xuming},
  booktitle = {Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
  year      = {2024},
}

RTMO: Towards High-Performance One-Stage Real-Time Multi-Person Pose Estimation Peng Lu, Tao Jiang, Yining Li, and 3 more authors In Proceedings of the IEEE Conference on Computer Vision and Pattern
Recognition (CVPR) 2024 Bib PDF Code
@inproceedings{lu2024rtmo,
  title     = {RTMO: Towards High-Performance One-Stage Real-Time Multi-Person Pose Estimation},
  author    = {Lu, Peng and Jiang, Tao and Li, Yining and Li, Xiangtai and Chen, Kai and Yang, Wenming},
  booktitle = {Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
  year      = {2024},
}

2023
Segment Any Point Cloud Sequences by Distilling Vision Foundation Models Youquan Liu, Lingdong Kong, Jun Cen, and 5 more authors Advances in Neural Information Processing Systems (NeurIPS) 2023 Bib PDF Code
% Conference paper: typed as inproceedings with the venue in booktitle rather than journal.
@inproceedings{liu2023segment,
  title     = {Segment Any Point Cloud Sequences by Distilling Vision Foundation Models},
  author    = {Liu, Youquan and Kong, Lingdong and Cen, Jun and Chen, Runnan and Zhang, Wenwei and Pan, Liang and Chen, Kai and Liu, Ziwei},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  year      = {2023},
}

Improving Pixel-based MIM by Reducing Wasted Modeling Capability Yuan Liu, Songyang Zhang, Jiacheng Chen, and 3 more authors In Proceedings of the IEEE International Conference on Computer Vision (ICCV) 2023 Bib PDF Code
@inproceedings{liu2023improving,
  title     = {Improving Pixel-based MIM by Reducing Wasted Modeling Capability},
  author    = {Liu, Yuan and Zhang, Songyang and Chen, Jiacheng and Yu, Zhaohui and Chen, Kai and Lin, Dahua},
  booktitle = {Proceedings of the IEEE International Conference on Computer Vision (ICCV)},
  year      = {2023},
}

Robo3d: Towards robust and reliable 3d perception against corruptions Lingdong Kong, Youquan Liu, Xin Li, and 6 more authors In Proceedings of the IEEE International Conference on Computer Vision (ICCV) 2023 Bib PDF Code
@inproceedings{kong2023robo3d,
  title     = {Robo3d: Towards robust and reliable 3d perception against corruptions},
  author    = {Kong, Lingdong and Liu, Youquan and Li, Xin and Chen, Runnan and Zhang, Wenwei and Ren, Jiawei and Pan, Liang and Chen, Kai and Liu, Ziwei},
  booktitle = {Proceedings of the IEEE International Conference on Computer Vision (ICCV)},
  year      = {2023},
}

Multimodal-gpt: A vision and language model for dialogue with humans Tao Gong, Chengqi Lyu, Shilong Zhang, and 7 more authors arXiv preprint arXiv:2305.04790 2023 Bib PDF Code
@article{gong2023multimodal,
  title   = {Multimodal-gpt: A vision and language model for dialogue with humans},
  author  = {Gong, Tao and Lyu, Chengqi and Zhang, Shilong and Wang, Yudong and Zheng, Miao and Zhao, Qian and Liu, Kuikun and Zhang, Wenwei and Luo, Ping and Chen, Kai},
  journal = {arXiv preprint arXiv:2305.04790},
  year    = {2023},
}

TG-VQA: Ternary Game of Video Question Answering Hao Li, Peng Jin, Zesen Cheng, and 5 more authors In International Joint Conference on Artificial Intelligence (IJCAI) 2023 Bib PDF
@inproceedings{li2023tg,
  title     = {TG-VQA: Ternary Game of Video Question Answering},
  author    = {Li, Hao and Jin, Peng and Cheng, Zesen and Zhang, Songyang and Chen, Kai and Wang, Zhennan and Liu, Chang and Chen, Jie},
  booktitle = {International Joint Conference on Artificial Intelligence (IJCAI)},
  year      = {2023},
}

RIFormer: Keep Your Vision Backbone Effective But Removing Token Mixer Jiahao Wang, Songyang Zhang, Yong Liu, and 6 more authors In Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR) 2023 Bib PDF Code Website
@inproceedings{wang2023riformer,
  title     = {RIFormer: Keep Your Vision Backbone Effective But Removing Token Mixer},
  author    = {Wang, Jiahao and Zhang, Songyang and Liu, Yong and Wu, Taiqiang and Yang, Yujiu and Liu, Xihui and Chen, Kai and Luo, Ping and Lin, Dahua},
  booktitle = {Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
  year      = {2023},
}

Dense Distinct Query for End-to-End Object Detection Shilong Zhang, Jiaqi Wang, Jiangmiao Pang, and 4 more authors In Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR) 2023 Bib PDF Code
@inproceedings{zhang2023dense,
  title     = {Dense Distinct Query for End-to-End Object Detection},
  author    = {Zhang, Shilong and Wang, Jiaqi and Pang, Jiangmiao and Lyu, Chengqi and Zhang, Wenwei and Luo, Ping and Chen, Kai},
  booktitle = {Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
  year      = {2023},
}

Consistent-Teacher: Towards Reducing Inconsistent Pseudo-targets in Semi-supervised Object Detection Xinjiang Wang, Xingyi Yang, Shilong Zhang, and 6 more authors In Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR) 2023 Bib PDF Code
@inproceedings{wang2023consistent,
  title     = {Consistent-Teacher: Towards Reducing Inconsistent Pseudo-targets in Semi-supervised Object Detection},
  author    = {Wang, Xinjiang and Yang, Xingyi and Zhang, Shilong and Li, Yijiang and Feng, Litong and Fang, Shijie and Lyu, Chengqi and Chen, Kai and Zhang, Wayne},
  booktitle = {Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
  year      = {2023},
}

StructToken: Rethinking Semantic Segmentation with Structural Prior Fangjian Lin, Zhanhao Liang, Sitong Wu, and 3 more authors IEEE Transactions on Circuits and Systems for Video Technology (TCSVT) 2023 Bib PDF Code
@article{lin2023structtoken,
  title     = {StructToken: Rethinking Semantic Segmentation with Structural Prior},
  author    = {Lin, Fangjian and Liang, Zhanhao and Wu, Sitong and He, Junjun and Chen, Kai and Tian, Shengwei},
  journal   = {IEEE Transactions on Circuits and Systems for Video Technology (TCSVT)},
  year      = {2023},
  publisher = {IEEE},
}

Semantics-Aware Dynamic Localization and Refinement for Referring Image Segmentation Zhao Yang, Jiaqi Wang, Yansong Tang, and 3 more authors Proceedings of the AAAI Conference on Artificial Intelligence (AAAI) 2023 Bib PDF
% Conference paper: inproceedings + booktitle, matching the other AAAI entry in this file.
% Initials are space-separated so name parsing keeps both of them.
@inproceedings{yang2023semantics,
  title     = {Semantics-Aware Dynamic Localization and Refinement for Referring Image Segmentation},
  author    = {Yang, Zhao and Wang, Jiaqi and Tang, Yansong and Chen, Kai and Zhao, Hengshuang and Torr, Philip H. S.},
  booktitle = {Proceedings of the AAAI Conference on Artificial Intelligence (AAAI)},
  year      = {2023},
}

Boosting Point Clouds Rendering via Radiance Mapping Xiaoyang Huang, Yi Zhang, Bingbing Ni, and 3 more authors Proceedings of the AAAI Conference on Artificial Intelligence (AAAI) 2023 Bib PDF Code
% Conference paper: inproceedings + booktitle, matching the other AAAI entry in this file.
@inproceedings{huang2023boosting,
  title     = {Boosting Point Clouds Rendering via Radiance Mapping},
  author    = {Huang, Xiaoyang and Zhang, Yi and Ni, Bingbing and Li, Teng and Chen, Kai and Zhang, Wenjun},
  booktitle = {Proceedings of the AAAI Conference on Artificial Intelligence (AAAI)},
  year      = {2023},
}

2022
RTMDet: An Empirical Study of Designing Real-Time Object Detectors Chengqi Lyu, Wenwei Zhang, Haian Huang, and 5 more authors arXiv preprint arXiv:2212.07784 2022 Bib PDF Code
@article{lyu2022rtmdet,
  title   = {RTMDet: An Empirical Study of Designing Real-Time Object Detectors},
  author  = {Lyu, Chengqi and Zhang, Wenwei and Huang, Haian and Zhou, Yue and Wang, Yudong and Liu, Yanyi and Zhang, Shilong and Chen, Kai},
  journal = {arXiv preprint arXiv:2212.07784},
  year    = {2022},
}

Deliberated Domain Bridging for Domain Adaptive Semantic Segmentation Lin Chen, Zhixiang Wei, Xin Jin, and 4 more authors Advances in Neural Information Processing Systems (NeurIPS) 2022 Bib PDF Code
% Conference paper: typed as inproceedings with the venue in booktitle rather than journal.
@inproceedings{chen2022deliberated,
  title     = {Deliberated Domain Bridging for Domain Adaptive Semantic Segmentation},
  author    = {Chen, Lin and Wei, Zhixiang and Jin, Xin and Chen, Huaian and Zheng, Miao and Chen, Kai and Jin, Yi},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  year      = {2022},
}

Group R-CNN for Weakly Semi-supervised Object Detection with Points Shilong Zhang, Zhuoran Yu, Liyang Liu, and 3 more authors In Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR) 2022 Bib PDF Code
@inproceedings{zhang2022group,
  title     = {Group R-CNN for Weakly Semi-supervised Object Detection with Points},
  author    = {Zhang, Shilong and Yu, Zhuoran and Liu, Liyang and Wang, Xinjiang and Zhou, Aojun and Chen, Kai},
  booktitle = {Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
  pages     = {9417--9426},
  year      = {2022},
}

TransRank: Self-supervised Video Representation Learning via Ranking-based Transformation Recognition Haodong Duan, Nanxuan Zhao, Kai Chen, and 1 more author In Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR) 2022 Bib PDF Code
@inproceedings{duan2022transrank,
  title     = {TransRank: Self-supervised Video Representation Learning via Ranking-based Transformation Recognition},
  author    = {Duan, Haodong and Zhao, Nanxuan and Chen, Kai and Lin, Dahua},
  booktitle = {Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
  pages     = {3000--3010},
  year      = {2022},
}

Video K-Net: A Simple, Strong, and Unified Baseline for Video Segmentation Xiangtai Li, Wenwei Zhang, Jiangmiao Pang, and 4 more authors In Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR) 2022 Bib PDF Code
@inproceedings{li2022video,
  title     = {Video K-Net: A Simple, Strong, and Unified Baseline for Video Segmentation},
  author    = {Li, Xiangtai and Zhang, Wenwei and Pang, Jiangmiao and Chen, Kai and Cheng, Guangliang and Tong, Yunhai and Loy, Chen Change},
  booktitle = {Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
  pages     = {18847--18857},
  year      = {2022},
}

Dense Siamese Network Wenwei Zhang, Jiangmiao Pang, Kai Chen, and 1 more author European Conference on Computer Vision (ECCV) 2022 Bib PDF Code Website
% Conference paper: inproceedings + booktitle, matching the other ECCV entry in this file.
@inproceedings{zhang2022dense,
  title     = {Dense Siamese Network},
  author    = {Zhang, Wenwei and Pang, Jiangmiao and Chen, Kai and Loy, Chen Change},
  booktitle = {European Conference on Computer Vision (ECCV)},
  year      = {2022},
}

Mitigating Representation Bias in Action Recognition: Algorithms and Benchmarks Haodong Duan, Yue Zhao, Kai Chen, and 2 more authors In European Conference on Computer Vision (ECCV) Workshop 2022 Bib PDF Code
% Springer is recorded as the publisher; the organization field is meant for a sponsoring body.
@inproceedings{duan2022mitigating,
  title     = {Mitigating Representation Bias in Action Recognition: Algorithms and Benchmarks},
  author    = {Duan, Haodong and Zhao, Yue and Chen, Kai and Xiong, Yuanjun and Lin, Dahua},
  booktitle = {European Conference on Computer Vision (ECCV) Workshop},
  year      = {2022},
  publisher = {Springer},
}

OCSampler: Compressing Videos to One Clip with Single-step Sampling Jintao Lin, Haodong Duan, Kai Chen, and 2 more authors In Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR) 2022 Bib PDF Code
@inproceedings{lin2022ocsampler,
  title     = {OCSampler: Compressing Videos to One Clip with Single-step Sampling},
  author    = {Lin, Jintao and Duan, Haodong and Chen, Kai and Lin, Dahua and Wang, Limin},
  booktitle = {Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
  pages     = {13894--13903},
  year      = {2022},
}

LAVT: Language-Aware Vision Transformer for Referring Image Segmentation Zhao Yang, Jiaqi Wang, Yansong Tang, and 3 more authors In Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR) 2022 Bib PDF Code
% Initials are written "H. S." (separate tokens) so both survive name parsing and abbreviation.
@inproceedings{yang2022lavt,
  title     = {LAVT: Language-Aware Vision Transformer for Referring Image Segmentation},
  author    = {Yang, Zhao and Wang, Jiaqi and Tang, Yansong and Chen, Kai and Zhao, Hengshuang and Torr, Philip H. S.},
  booktitle = {Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
  pages     = {18155--18165},
  year      = {2022},
}

Pyskl: Towards good practices for skeleton action recognition Haodong Duan, Jiaqi Wang, Kai Chen, and 1 more author In Proceedings of the 30th ACM International Conference on Multimedia 2022 Bib PDF Code
@inproceedings{duan2022pyskl,
  title     = {Pyskl: Towards good practices for skeleton action recognition},
  author    = {Duan, Haodong and Wang, Jiaqi and Chen, Kai and Lin, Dahua},
  booktitle = {Proceedings of the 30th ACM International Conference on Multimedia},
  pages     = {7351--7354},
  year      = {2022},
}
MMRotate: A Rotated Object Detection Benchmark Using PyTorch Yue Zhou, Xue Yang, Gefan Zhang, and 9 more authors In Proceedings of the 30th ACM International Conference on Multimedia 2022 Bib PDF Code
@inproceedings{zhou2022mmrotate,
  title     = {MMRotate: A Rotated Object Detection Benchmark Using PyTorch},
  author    = {Zhou, Yue and Yang, Xue and Zhang, Gefan and Wang, Jiabao and Liu, Yanyi and Hou, Liping and Jiang, Xue and Liu, Xingzhao and Yan, Junchi and Lyu, Chengqi and Zhang, Wenwei and Chen, Kai},
  booktitle = {Proceedings of the 30th ACM International Conference on Multimedia},
  year      = {2022},
}

Revisiting Skeleton-based Action Recognition Haodong Duan, Yue Zhao, Kai Chen, and 2 more authors In Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR) 2022 Bib PDF Code
@inproceedings{duan2022revisiting,
  title     = {Revisiting Skeleton-based Action Recognition},
  author    = {Duan, Haodong and Zhao, Yue and Chen, Kai and Lin, Dahua and Dai, Bo},
  booktitle = {Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
  pages     = {2969--2978},
  year      = {2022},
}

2021
Few-Shot Object Detection via Association and DIscrimination Yuhang Cao, Jiaqi Wang, Ying Jin, and 4 more authors Advances in Neural Information Processing Systems (NeurIPS) 2021 Bib PDF Code
% Conference paper: typed as inproceedings with the venue in booktitle; volume and pages are kept.
% NOTE(review): the capitalised "DI" in the title is kept as stored; it looks deliberate - confirm.
@inproceedings{cao2021few,
  title     = {Few-Shot Object Detection via Association and DIscrimination},
  author    = {Cao, Yuhang and Wang, Jiaqi and Jin, Ying and Wu, Tong and Chen, Kai and Liu, Ziwei and Lin, Dahua},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  volume    = {34},
  pages     = {16570--16581},
  year      = {2021},
}

MMOCR: A Comprehensive Toolbox for Text Detection, Recognition and Understanding Zhanghui Kuang, Hongbin Sun, Zhizhong Li, and 10 more authors In Proceedings of the 29th ACM International Conference on Multimedia 2021 Bib PDF Code
@inproceedings{kuang2021mmocr,
  title     = {MMOCR: A Comprehensive Toolbox for Text Detection, Recognition and Understanding},
  author    = {Kuang, Zhanghui and Sun, Hongbin and Li, Zhizhong and Yue, Xiaoyu and Lin, Tsui Hin and Chen, Jianyong and Wei, Huaqiang and Zhu, Yiqin and Gao, Tong and Zhang, Wenwei and Chen, Kai and Zhang, Wayne and Lin, Dahua},
  booktitle = {Proceedings of the 29th ACM International Conference on Multimedia},
  pages     = {3791--3794},
  year      = {2021},
}

K-Net: Towards Unified Image Segmentation Wenwei Zhang, Jiangmiao Pang, Kai Chen, and 1 more author Advances in Neural Information Processing Systems (NeurIPS) 2021 Bib PDF Code Website
% Conference paper: typed as inproceedings with the venue in booktitle; volume and pages are kept.
@inproceedings{zhang2021k,
  title     = {K-Net: Towards Unified Image Segmentation},
  author    = {Zhang, Wenwei and Pang, Jiangmiao and Chen, Kai and Loy, Chen Change},
  booktitle = {Advances in Neural Information Processing Systems (NeurIPS)},
  volume    = {34},
  pages     = {10326--10338},
  year      = {2021},
}

Temporal ROI Align for Video Object Recognition Tao Gong, Kai Chen, Xinjiang Wang, and 5 more authors In Proceedings of the AAAI Conference on Artificial Intelligence (AAAI) 2021 Bib PDF Code
@inproceedings{gong2021temporal,
  title     = {Temporal ROI Align for Video Object Recognition},
  author    = {Gong, Tao and Chen, Kai and Wang, Xinjiang and Chu, Qi and Zhu, Feng and Lin, Dahua and Yu, Nenghai and Feng, Huamin},
  booktitle = {Proceedings of the AAAI Conference on Artificial Intelligence (AAAI)},
  volume    = {35},
  number    = {2},
  pages     = {1442--1450},
  year      = {2021},
}

Towards Balanced Learning for Instance Recognition Jiangmiao Pang, Kai Chen, Qi Li, and 5 more authors International Journal of Computer Vision (IJCV) 2021 Bib HTML
@article{pang2021towards,
  title     = {Towards Balanced Learning for Instance Recognition},
  author    = {Pang, Jiangmiao and Chen, Kai and Li, Qi and Xu, Zhihai and Feng, Huajun and Shi, Jianping and Ouyang, Wanli and Lin, Dahua},
  journal   = {International Journal of Computer Vision (IJCV)},
  volume    = {129},
  number    = {5},
  pages     = {1376--1393},
  year      = {2021},
  publisher = {Springer US},
}

CARAFE++: Unified Content-Aware ReAssembly of FEatures
Jiaqi Wang, Kai Chen, Rui Xu, and 3 more authors IEEE Transactions on Pattern Analysis and Machine Intelligence (TPAMI) 2021 Bib PDF
@article{wang2021carafe++,
  title     = {CARAFE++: Unified Content-Aware ReAssembly of FEatures},
  author    = {Wang, Jiaqi and Chen, Kai and Xu, Rui and Liu, Ziwei and Loy, Chen Change and Lin, Dahua},
  journal   = {IEEE Transactions on Pattern Analysis and Machine Intelligence (TPAMI)},
  year      = {2021},
  publisher = {IEEE},
}

2020
Seesaw Loss for Long-Tailed Instance Segmentation Jiaqi Wang, Wenwei Zhang, Yuhang Zang, and 7 more authors In Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR) 2020 Bib PDF Code
@inproceedings{wang2020seesaw,
  title     = {Seesaw Loss for Long-Tailed Instance Segmentation},
  author    = {Wang, Jiaqi and Zhang, Wenwei and Zang, Yuhang and Cao, Yuhang and Pang, Jiangmiao and Gong, Tao and Chen, Kai and Liu, Ziwei and Loy, Chen Change and Lin, Dahua},
  booktitle = {Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
  year      = {2020},
}

Positional Encoding as Spatial Inductive Bias in GANs Rui Xu, Xintao Wang, Kai Chen, and 2 more authors In Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR) 2020 Bib PDF Code Website
@inproceedings{xu2020positional,
  title     = {Positional Encoding as Spatial Inductive Bias in GANs},
  author    = {Xu, Rui and Wang, Xintao and Chen, Kai and Zhou, Bolei and Loy, Chen Change},
  booktitle = {Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
  year      = {2020},
}

Feature Pyramid Grids Kai Chen, Yuhang Cao, Chen Change Loy, and 2 more authors arXiv preprint arXiv:2004.03580 2020 Bib PDF Code
@article{chen2020feature,
  title   = {Feature Pyramid Grids},
  author  = {Chen, Kai and Cao, Yuhang and Loy, Chen Change and Lin, Dahua and Feichtenhofer, Christoph},
  journal = {arXiv preprint arXiv:2004.03580},
  year    = {2020},
}

Side-Aware Boundary Localization for More Precise Object Detection Jiaqi
Wang, Wenwei Zhang, Yuhang Cao, and 6 more authors In European Conference on Computer Vision (ECCV) 2020 Bib PDF Code
% Publisher and its city are stored in publisher/address; organization is meant for a sponsoring body.
@inproceedings{wang2020side,
  title     = {Side-Aware Boundary Localization for More Precise Object Detection},
  author    = {Wang, Jiaqi and Zhang, Wenwei and Cao, Yuhang and Chen, Kai and Pang, Jiangmiao and Gong, Tao and Shi, Jianping and Loy, Chen Change and Lin, Dahua},
  booktitle = {European Conference on Computer Vision (ECCV)},
  pages     = {403--419},
  year      = {2020},
  publisher = {Springer},
  address   = {Cham},
}

Prime sample attention in object detection Yuhang Cao, Kai Chen, Chen Change Loy, and 1 more author In Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR) 2020 Bib PDF Code
@inproceedings{cao2020prime,
  title     = {Prime sample attention in object detection},
  author    = {Cao, Yuhang and Chen, Kai and Loy, Chen Change and Lin, Dahua},
  booktitle = {Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
  pages     = {11583--11591},
  year      = {2020},
}

2019
Libra R-CNN: Towards Balanced Learning for Object Detection Jiangmiao Pang, Kai Chen, Jianping Shi, and 3 more authors In Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR) 2019 Bib PDF Code
@inproceedings{pang2019libra,
  title     = {Libra R-CNN: Towards Balanced Learning for Object Detection},
  author    = {Pang, Jiangmiao and Chen, Kai and Shi, Jianping and Feng, Huajun and Ouyang, Wanli and Lin, Dahua},
  booktitle = {Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
  pages     = {821--830},
  year      = {2019},
}

Region Proposal by Guided Anchoring Jiaqi Wang*, Kai Chen*, Shuo Yang, and 2 more authors In Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR) 2019 Bib PDF Code
% Fourth author is written "Loy, Chen Change", the surname-first form every other entry uses for this name.
% NOTE(review): the "*" suffixes become part of the parsed surnames; presumably author-role markers shown on the page - confirm they are intended.
@inproceedings{wang2019region,
  title     = {Region Proposal by Guided Anchoring},
  author    = {Wang*, Jiaqi and Chen*, Kai and Yang, Shuo and Loy, Chen Change and Lin, Dahua},
  booktitle = {Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
  pages     = {2965--2974},
  year      = {2019},
}

Hybrid task cascade for instance segmentation Kai Chen, Jiangmiao Pang, Jiaqi Wang, and 9 more authors In Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR) 2019 Bib PDF Code
@inproceedings{chen2019hybrid,
  title     = {Hybrid task cascade for instance segmentation},
  author    = {Chen, Kai and Pang, Jiangmiao and Wang, Jiaqi and Xiong, Yu and Li, Xiaoxiao and Sun, Shuyang and Feng, Wansen and Liu, Ziwei and Shi, Jianping and Ouyang, Wanli and Loy, Chen Change and Lin, Dahua},
  booktitle = {Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
  pages     = {4974--4983},
  year      = {2019},
}

MMDetection: Open MMLab Detection Toolbox and Benchmark Kai Chen, Jiaqi Wang*, Jiangmiao Pang*, and 22 more authors arXiv preprint arXiv:1906.07155 2019 Bib PDF Code
% NOTE(review): the "*" suffixes become part of the parsed surnames; presumably author-role markers shown on the page - confirm they are intended.
@article{chen2019mmdetection,
  title   = {MMDetection: Open MMLab Detection Toolbox and Benchmark},
  author  = {Chen, Kai and Wang*, Jiaqi and Pang*, Jiangmiao and Cao, Yuhang and Xiong, Yu and Li, Xiaoxiao and Sun, Shuyang and Feng, Wansen and Liu, Ziwei and Xu, Jiarui and Zhang, Zheng and Cheng, Dazhi and Zhu, Chenchen and Cheng, Tianheng and Zhao, Qijie and Li, Buyu and Lu, Xin and Zhu, Rui and Wu, Yue and Dai, Jifeng and Wang, Jingdong and Shi, Jianping and Ouyang, Wanli and Loy, Chen Change and Lin, Dahua},
  journal = {arXiv preprint arXiv:1906.07155},
  year    = {2019},
}

CARAFE: Content-Aware ReAssembly of FEatures Jiaqi Wang, Kai Chen, Rui Xu, and 3 more authors In Proceedings of the IEEE International Conference on Computer Vision (ICCV) 2019 Bib PDF Code
@inproceedings{wang2019carafe,
  title     = {CARAFE: Content-Aware ReAssembly of FEatures},
  author    = {Wang, Jiaqi and Chen, Kai and Xu, Rui and Liu, Ziwei and Loy, Chen Change and Lin, Dahua},
  booktitle = {Proceedings of the IEEE International Conference on Computer Vision (ICCV)},
  year      = {2019},
}

2018
Optimizing Video
Object Detection via a Scale-Time Lattice Kai Chen, Jiaqi Wang, Shuo Yang, and 4 more authors In Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR) 2018 Bib PDF Website
@inproceedings{chen2018optimizing,
  title     = {Optimizing Video Object Detection via a Scale-Time Lattice},
  author    = {Chen, Kai and Wang, Jiaqi and Yang, Shuo and Zhang, Xingcheng and Xiong, Yuanjun and Loy, Chen Change and Lin, Dahua},
  booktitle = {Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
  pages     = {7814--7823},
  year      = {2018},
}

2017
Video Object Segmentation with Re-identification Xiaoxiao Li, Yuankai Qi, Zhe Wang, and 6 more authors IEEE Conference on Computer Vision and Pattern Recognition (CVPR) Workshop 2017 Bib PDF Website
% Workshop paper: typed as inproceedings with the venue in booktitle rather than journal.
@inproceedings{li2017video,
  title     = {Video Object Segmentation with Re-identification},
  author    = {Li, Xiaoxiao and Qi, Yuankai and Wang, Zhe and Chen, Kai and Liu, Ziwei and Shi, Jianping and Luo, Ping and Tang, Xiaoou and Loy, Chen Change},
  booktitle = {IEEE Conference on Computer Vision and Pattern Recognition (CVPR) Workshop},
  year      = {2017},
}

Discover and Learn New Objects from Documentaries Kai Chen, Hang Song, Chen Change Loy, and 1 more author In Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR) 2017 Bib PDF Website Dataset
@inproceedings{chen2017discover,
  title     = {Discover and Learn New Objects from Documentaries},
  author    = {Chen, Kai and Song, Hang and Loy, Chen Change and Lin, Dahua},
  booktitle = {Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR)},
  year      = {2017},
}