@inproceedings{d4ba2d46aed54ab18cd6d3d355df5883,
title = "An Interactive Evaluation Framework for Empathetic Response Generation",
abstract = "Empathetic response generation is a significant domain in Natural Language Processing (NLP). Its development is a critical step toward achieving humanized AI systems. However, current evaluations of empathetic dialogue models are primarily single-turn and static, leading to bias between evaluation results and real-world multi-turn interaction performance. To overcome the longstanding challenge, we propose a novel Interactive Empathy Evaluation Framework (IEEF). It eliminates the bias by facilitating a human-free multi-turn interaction evaluation. Specifically, for human-free interaction, we design a user simulator using reinforcement learning, leveraging a reward model based on LLM scoring. For evalution, we introduce a series of empathy-related metrics based on LLM. The experiments show that IEEF's evaluation results are highly correlated with real-world multi-turn interaction performance, demonstrating its alignment with human preferences in empathy evaluation.",
keywords = "Dialogue System, Empathetic Dialogue, Empathy Metrics, LLM Scoring, Natural Language Processing",
author = "Xixi Lei and Changqun Li and Liang He and Xin Lin",
note = "Publisher Copyright: {\textcopyright} 2025 IEEE.; 2025 IEEE International Conference on Acoustics, Speech, and Signal Processing, ICASSP 2025 ; Conference date: 06-04-2025 Through 11-04-2025",
year = "2025",
doi = "10.1109/ICASSP49660.2025.10887960",
language = "英语",
series = "ICASSP, IEEE International Conference on Acoustics, Speech and Signal Processing - Proceedings",
publisher = "Institute of Electrical and Electronics Engineers Inc.",
editor = "Rao, \{Bhaskar D\} and Isabel Trancoso and Gaurav Sharma and Mehta, \{Neelesh B.\}",
booktitle = "2025 IEEE International Conference on Acoustics, Speech, and Signal Processing, ICASSP 2025 - Proceedings",
address = "美国",
}