[{"data":1,"prerenderedAt":-1},["ShallowReactive",2],{"doc-detail-32245":3,"doc-seo-32245":27},{"code":4,"msg":5,"data":6},0,"success",{"doc_id":7,"user_id":8,"nickname":9,"user_avatar":10,"doc_module":4,"category_id":11,"category_name":12,"doc_title":13,"doc_description":14,"file_id":15,"file_url":16,"file_type":17,"file_size":18,"view_count":4,"is_deleted":4,"is_public":19,"is_downloadable":19,"audit_status":19,"page_count":20,"language":21,"language_code":22,"table_of_contents":23,"faqs":24,"seo_title":13,"seo_description":14,"update_tm":25,"read_time":26},32245,962075006959,"Anda","https://ap-avatar.wpscdn.com/avatar/e0002397efbe92a78e?_k=1776741047341049297",8,"Research & Report","LLM Content Moderation and User Satisfaction: Evidence from Response Refusals in Chatbot Arena","LLM safety and ethical alignment remain widely discussed, while the effect of content moderation on user satisfaction is still underexplored. Analyzing nearly 50,000 model comparisons from Chatbot Arena, this work studies how users react when models refuse prompts. A RoBERTa-based refusal classifier separates ethical refusals from technical limitations. Results show a substantial refusal penalty: ethical refusals receive lower win rates than technical refusals and standard responses. The penalty varies with prompt sensitivity and refusal phrasing, highlighting a safety-versus-expectations tension.","cbCaip4vV3emTlQh","https://ap.wps.com/l/cbCaip4vV3emTlQh","pdf",1019761,1,29,"English","en","# Introduction\n## Background and motivation\n## Research questions\n## Approach and dataset","[{\"question\":\"What gap does the paper address about LLM safety and moderation?\",\"answer\":\"The paper targets how content moderation via refusal behavior affects user satisfaction, which has received less direct study than system-level refusal optimization.\"},{\"question\":\"How does the study distinguish ethical refusals from technical limitations?\",\"answer\":\"It fine-tunes a RoBERTa-based refusal classifier on a hand-labeled dataset to classify different refusal causes.\"},{\"question\":\"What overall effect do ethical refusals have on user preferences?\",\"answer\":\"Ethical refusals incur a substantial penalty, producing significantly lower win rates than technical refusals and standard responses.\"}]",1781039546,73,{"code":4,"msg":28,"data":29},"ok",{"site_id":30,"language":22,"slug":31,"title":13,"keywords":32,"description":14,"schema_data":33,"social_meta":84,"head_meta":86,"extra_data":88,"updated_unix":25},105,"llm-content-moderation-and-user-satisfaction-evidence-from-response-refusals-in-chatbot-arena","",{"@graph":34,"@context":83},[35,52,66],{"@type":36,"itemListElement":37},"BreadcrumbList",[38,42,46,49],{"item":39,"name":40,"@type":41,"position":19},"https://docshare.wps.com","Home","ListItem",{"item":43,"name":44,"@type":41,"position":45},"https://docshare.wps.com/document/","Document",2,{"item":47,"name":12,"@type":41,"position":48},"https://docshare.wps.com/document/research-report/",3,{"item":50,"name":13,"@type":41,"position":51},"https://docshare.wps.com/document/llm-content-moderation-and-user-satisfaction-evidence-from-response-refusals-in-chatbot-arena/32245/",4,{"url":50,"name":13,"@type":53,"author":54,"headline":13,"publisher":56,"fileFormat":59,"description":14,"dateModified":60,"datePublished":60,"encodingFormat":59,"isAccessibleForFree":61,"interactionStatistic":62},"DigitalDocument",{"name":9,"@type":55},"Person",{"url":39,"name":57,"@type":58},"DocShare","Organization","application/pdf","2026-06-09",true,{"@type":63,"interactionType":64,"userInteractionCount":4},"InteractionCounter",{"@type":65},"ViewAction",{"@type":67,"mainEntity":68},"FAQPage",[69,75,79],{"name":70,"@type":71,"acceptedAnswer":72},"What gap does the paper address about LLM safety and moderation?","Question",{"text":73,"@type":74},"The paper targets how content moderation via refusal behavior affects user satisfaction, which has received less direct study than system-level refusal optimization.","Answer",{"name":76,"@type":71,"acceptedAnswer":77},"How does the study distinguish ethical refusals from technical limitations?",{"text":78,"@type":74},"It fine-tunes a RoBERTa-based refusal classifier on a hand-labeled dataset to classify different refusal causes.",{"name":80,"@type":71,"acceptedAnswer":81},"What overall effect do ethical refusals have on user preferences?",{"text":82,"@type":74},"Ethical refusals incur a substantial penalty, producing significantly lower win rates than technical refusals and standard responses.","https://schema.org",{"og:url":50,"og:type":85,"og:title":13,"og:site_name":57,"og:description":14},"article",{"robots":87,"canonical":50},"index,follow",{"doc_id":7,"site_id":30}]