% Conference paper (NAACL-HLT 2025, long papers); the entry was cleaned up from a repository export.
% Changes relative to the export:
%   - author: removed escaped braces around "Min Kyung" (they printed as literal braces);
%     all names are now in "Last, First" form.
%   - booktitle now holds the proceedings title (the export had it in "series" and
%     put only the volume label "Long Papers" in booktitle).
%   - title: acronyms are brace-protected against style recasing.
%   - abstract: restored em-dashes and the hyphen in "Llama-3-70b-Instruct".
% NOTE(review): address is kept as exported ("United States"); it is presumably meant to be
% the publisher or conference city -- confirm against the publisher record before relying on it.
@inproceedings{455265b9d47742528b675cfbe67ace0b,
  author    = {Duan, Jinhao and Zhao, Xinyu and Zhang, Zhuoxuan and Ko, Eunhye and Boddy, Lily and Wang, Chenan and Li, Tianhao and Rasgon, Alexander and Hong, Junyuan and Lee, Min Kyung and Yuan, Chenxi and Long, Qi and Ding, Ying and Chen, Tianlong and Xu, Kaidi},
  title     = {{GUIDELLM}: Exploring {LLM}-Guided Conversation with Applications in Autobiography Interviewing},
  booktitle = {Proceedings of the 2025 Annual Conference of the Nations of the Americas Chapter of the Association for Computational Linguistics: Human Language Technologies: Long Papers, {NAACL-HLT} 2025},
  editor    = {Chiruzzo, Luis and Ritter, Alan and Wang, Lu},
  pages     = {5558--5588},
  publisher = {Association for Computational Linguistics (ACL)},
  address   = {United States},
  year      = {2025},
  doi       = {10.18653/v1/2025.naacl-long.287},
  language  = {English (US)},
  note      = {Publisher Copyright: {\textcopyright} 2025 Association for Computational Linguistics.; 2025 Annual Conference of the Nations of the Americas Chapter of the Association for Computational Linguistics: Human Language Technologies, NAACL-HLT 2025 ; Conference date: 29-04-2025 Through 04-05-2025},
  abstract  = {Although Large Language Models (LLMs) succeed in human-guided conversations such as instruction following and question answering, the potential of LLM-guided conversations---where LLMs direct the discourse and steer the conversation's objectives---remains under-explored. In this study, we first characterize LLM-guided conversation into three fundamental components: (i) Goal Navigation; (ii) Context Management; (iii) Empathetic Engagement, and propose GUIDELLM as an installation. We then implement an interviewing environment for the evaluation of LLM-guided conversation. Specifically, various topics are involved in this environment for comprehensive interviewing evaluation, resulting in around 1.4k turns of utterances, 184k tokens, and over 200 events mentioned during the interviewing for each chatbot evaluation. We compare GUIDELLM with 6 state-of-the-art LLMs such as GPT-4o and Llama-3-70b-Instruct, from the perspective of interviewing quality, and autobiography generation quality. For automatic evaluation, we derive user proxies from multiple autobiographies and employ LLM-as-a-judge to score LLM behaviors. We further conduct a human-involved experiment by employing 45 human participants to chat with GUIDELLM and baselines. We then collect human feedback, preferences, and ratings regarding the qualities of conversation and autobiography. Experimental results indicate that GUIDELLM significantly outperforms baseline LLMs in automatic evaluation and achieves consistent leading performances in human ratings.},
}