Publications | Kai Chen

2024

ANAH: Analytical Annotation of Hallucinations in Large Language Models

Ziwei Ji, Yuzhe Gu, Wenwei Zhang, and 3 more authors

In Proceedings of the Annual Meeting of the Association for Computational Linguistics (ACL), 2024

@inproceedings{ji2024anah,
  title     = {{ANAH}: Analytical Annotation of Hallucinations in Large Language Models},
  author    = {Ji, Ziwei and Gu, Yuzhe and Zhang, Wenwei and Lyu, Chengqi and Lin, Dahua and Chen, Kai},
  booktitle = {Proceedings of the Annual Meeting of the Association for Computational Linguistics (ACL)},
  year      = {2024},
}

T-Eval: Evaluating the Tool Utilization Capability of Large Language Models Step by Step

Zehui Chen, Weihua Du, Wenwei Zhang, and 8 more authors

In Proceedings of the Annual Meeting of the Association for Computational Linguistics (ACL), 2024

Bib PDF Code Website

@inproceedings{chen2024t,
  title     = {{T-Eval}: Evaluating the Tool Utilization Capability of Large Language Models Step by Step},
  author    = {Chen, Zehui and Du, Weihua and Zhang, Wenwei and Liu, Kuikun and Liu, Jiangning and Zheng, Miao and Zhuo, Jingming and Zhang, Songyang and Lin, Dahua and Chen, Kai and Zhao, Feng},
  booktitle = {Proceedings of the Annual Meeting of the Association for Computational Linguistics (ACL)},
  year      = {2024},
}

Agent-FLAN: Designing Data and Methods of Effective Agent Tuning for Large Language Models

Zehui Chen, Kuikun Liu, Qiuchen Wang, and 5 more authors

In Findings of the Association for Computational Linguistics: ACL, 2024

Bib PDF Code

@inproceedings{chen2024agent,
  title     = {{Agent-FLAN}: Designing Data and Methods of Effective Agent Tuning for Large Language Models},
  author    = {Chen, Zehui and Liu, Kuikun and Wang, Qiuchen and Zhang, Wenwei and Liu, Jiangning and Lin, Dahua and Chen, Kai and Zhao, Feng},
  booktitle = {Findings of the Association for Computational Linguistics: ACL},
  year      = {2024},
}

LLaST: Improved End-to-end Speech Translation System Leveraged by Large Language Models

Xi Chen, Songyang Zhang, Qibing Bai, and 2 more authors

In Findings of the Association for Computational Linguistics: ACL, 2024

Bib

@inproceedings{chen2024llast,
  title     = {{LLaST}: Improved End-to-end Speech Translation System Leveraged by Large Language Models},
  author    = {Chen, Xi and Zhang, Songyang and Bai, Qibing and Chen, Kai and Nakamura, Satoshi},
  booktitle = {Findings of the Association for Computational Linguistics: ACL},
  year      = {2024},
}

MathBench: Evaluating the Theory and Application Proficiency of LLMs with a Hierarchical Mathematics Benchmark

Hongwei Liu, Zilong Zheng, Yuxuan Qiao, and 7 more authors

In Findings of the Association for Computational Linguistics: ACL, 2024

Bib PDF Code

@inproceedings{liu2024mathbench,
  title     = {{MathBench}: Evaluating the Theory and Application Proficiency of {LLMs} with a Hierarchical Mathematics Benchmark},
  author    = {Liu, Hongwei and Zheng, Zilong and Qiao, Yuxuan and Duan, Haodong and Fei, Zhiwei and Zhou, Fengzhe and Zhang, Wenwei and Zhang, Songyang and Lin, Dahua and Chen, Kai},
  booktitle = {Findings of the Association for Computational Linguistics: ACL},
  year      = {2024},
}

Differential Model Scaling using Differential Topk

Kai Liu, Ruohui Wang, Jianfei Gao, and 1 more author

In International Conference on Machine Learning (ICML), 2024

Bib

@inproceedings{liu2024differential,
  title     = {Differential Model Scaling using Differential Topk},
  author    = {Liu, Kai and Wang, Ruohui and Gao, Jianfei and Chen, Kai},
  booktitle = {International Conference on Machine Learning (ICML)},
  year      = {2024},
}

Can AI Assistants Know What They Don’t Know?

Qinyuan Cheng, Tianxiang Sun, Xiangyang Liu, and 6 more authors

In International Conference on Machine Learning (ICML), 2024

Bib PDF Code

@inproceedings{cheng2024can,
  title     = {Can {AI} Assistants Know What They Don't Know?},
  author    = {Cheng, Qinyuan and Sun, Tianxiang and Liu, Xiangyang and Zhang, Wenwei and Yin, Zhangyue and Li, Shimin and Li, Linyang and Chen, Kai and Qiu, Xipeng},
  booktitle = {International Conference on Machine Learning (ICML)},
  year      = {2024},
}

Ada-LEval: Evaluating long-context LLMs with length-adaptable benchmarks

Chonghua Wang, Haodong Duan, Songyang Zhang, and 2 more authors

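In Proceedings of the Conference of the North American Chapter of the Association for Computational Linguistics (NAACL), 2024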

Bib PDF Code

@inproceedings{wang2024ada,
  title     = {{Ada-LEval}: Evaluating long-context {LLMs} with length-adaptable benchmarks},
  author    = {Wang, Chonghua and Duan, Haodong and Zhang, Songyang and Lin, Dahua and Chen, Kai},
  booktitle = {Proceedings of the Conference of the North American Chapter of the Association for Computational Linguistics (NAACL)},
  year      = {2024},
}

BotChat: Evaluating LLMs’ Capabilities of Having Multi-Turn Dialogues

Haodong Duan, Jueqi Wei, Chonghua Wang, and 5 more authors

In Findings of the Association for Computational Linguistics: NAACL, 2024

Bib PDF Code

@inproceedings{duan2023botchat,
  title     = {{BotChat}: Evaluating {LLMs}' Capabilities of Having Multi-Turn Dialogues},
  author    = {Duan, Haodong and Wei, Jueqi and Wang, Chonghua and Liu, Hongwei and Fang, Yixiao and Zhang, Songyang and Lin, Dahua and Chen, Kai},
  booktitle = {Findings of the Association for Computational Linguistics: NAACL},
  year      = {2024},
}