{"id":"https://openalex.org/W4387995378","doi":"https://doi.org/10.48550/arxiv.2310.17389","title":"ToxicChat: Unveiling Hidden Challenges of Toxicity Detection in Real-World User-AI Conversation","display_name":"ToxicChat: Unveiling Hidden Challenges of Toxicity Detection in Real-World User-AI Conversation","publication_year":2023,"publication_date":"2023-10-26","ids":{"openalex":"https://openalex.org/W4387995378","doi":"https://doi.org/10.48550/arxiv.2310.17389"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2310.17389","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2310.17389","pdf_url":"https://arxiv.org/pdf/2310.17389","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":null},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2310.17389","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5103777591","display_name":"Lin Zi","orcid":"https://orcid.org/0009-0008-0052-2817"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Lin, Zi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100380102","display_name":"Zihan Wang","orcid":"https://orcid.org/0009-0006-1175-6163"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Zihan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5010726742","display_name":"Yongqi Tong","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tong, Yongqi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5015179224","display_name":"Yangkun Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Yangkun","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5023758850","display_name":"Yuxin Guo","orcid":"https://orcid.org/0000-0002-6082-4218"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Guo, Yuxin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100767801","display_name":"Yujia Wang","orcid":"https://orcid.org/0000-0002-6733-4967"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Yujia","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5039500313","display_name":"Jingbo Shang","orcid":"https://orcid.org/0000-0002-7249-4404"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shang, Jingbo","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5103777591"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12262","display_name":"Hate Speech and Cyberbullying Detection","score":0.9958999752998352,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12262","display_name":"Hate Speech and Cyberbullying Detection","score":0.9958999752998352,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9606999754905701,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13629","display_name":"Text Readability and Simplification","score":0.9469000101089478,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6890177726745605},{"id":"https://openalex.org/keywords/conversation","display_name":"Conversation","score":0.685736358165741},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.6820207238197327},{"id":"https://openalex.org/keywords/chatbot","display_name":"Chatbot","score":0.5739346742630005},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.5631316304206848},{"id":"https://openalex.org/keywords/open-domain","display_name":"Open domain","score":0.49026253819465637},{"id":"https://openalex.org/keywords/social-media","display_name":"Social media","score":0.4493095874786377},{"id":"https://openalex.org/keywords/resource","display_name":"Resource (disambiguation)","score":0.4413872957229614},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.43997058272361755},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.40549516677856445},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.3375069200992584},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.28400591015815735},{"id":"https://openalex.org/keywords/question-answering","display_name":"Question answering","score":0.08061468601226807}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6890177726745605},{"id":"https://openalex.org/C2777200299","wikidata":"https://www.wikidata.org/wiki/Q52943","display_name":"Conversation","level":2,"score":0.685736358165741},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.6820207238197327},{"id":"https://openalex.org/C2779041454","wikidata":"https://www.wikidata.org/wiki/Q870780","display_name":"Chatbot","level":2,"score":0.5739346742630005},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.5631316304206848},{"id":"https://openalex.org/C2993776861","wikidata":"https://www.wikidata.org/wiki/Q1074173","display_name":"Open domain","level":3,"score":0.49026253819465637},{"id":"https://openalex.org/C518677369","wikidata":"https://www.wikidata.org/wiki/Q202833","display_name":"Social media","level":2,"score":0.4493095874786377},{"id":"https://openalex.org/C206345919","wikidata":"https://www.wikidata.org/wiki/Q20380951","display_name":"Resource (disambiguation)","level":2,"score":0.4413872957229614},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.43997058272361755},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.40549516677856445},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.3375069200992584},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.28400591015815735},{"id":"https://openalex.org/C44291984","wikidata":"https://www.wikidata.org/wiki/Q1074173","display_name":"Question answering","level":2,"score":0.08061468601226807},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2310.17389","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2310.17389","pdf_url":"https://arxiv.org/pdf/2310.17389","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":null},{"id":"doi:10.48550/arxiv.2310.17389","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2310.17389","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article-journal"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2310.17389","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2310.17389","pdf_url":"https://arxiv.org/pdf/2310.17389","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":null},"sustainable_development_goals":[{"score":0.7200000286102295,"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W3176963395","https://openalex.org/W4287887667","https://openalex.org/W2947270058","https://openalex.org/W2950299257","https://openalex.org/W4312591757","https://openalex.org/W4297969376","https://openalex.org/W2984132767","https://openalex.org/W2939728130","https://openalex.org/W3127222075","https://openalex.org/W3094899196"],"abstract_inverted_index":{"Despite":[0],"remarkable":[1],"advances":[2],"that":[3,75],"large":[4],"language":[5],"models":[6,83,100],"have":[7,28],"achieved":[8],"in":[9,25,128],"chatbots,":[10],"maintaining":[11],"a":[12,56,87,138,147],"non-toxic":[13],"user-AI":[14,46,130,153],"interactive":[15],"environment":[16,151],"has":[17,106],"become":[18],"increasingly":[19],"critical":[20],"nowadays.":[21],"However,":[22],"previous":[23],"efforts":[24],"toxicity":[26,81,104,126],"detection":[27,82,127],"been":[29],"mostly":[30],"based":[31,59],"on":[32,60,102],"benchmarks":[33],"derived":[34],"from":[35,64],"social":[36,93],"media":[37,94],"content,":[38],"leaving":[39],"the":[40,71,121,133],"unique":[41,114],"challenges":[42,124],"inherent":[43],"to":[44,84,92,112,141],"real-world":[45,129],"interactions":[47],"insufficiently":[48],"explored.":[49],"In":[50,132],"this":[51,113],"work,":[52],"we":[53],"introduce":[54],"ToxicChat,":[55],"novel":[57],"benchmark":[58,69],"real":[61],"user":[62],"queries":[63],"an":[65],"open-source":[66],"chatbot.":[67],"This":[68],"contains":[70],"rich,":[72],"nuanced":[73],"phenomena":[74],"can":[76,136],"be":[77,137],"tricky":[78],"for":[79,152],"current":[80],"identify,":[85],"revealing":[86],"significant":[88],"domain":[89,115],"difference":[90],"compared":[91],"content.":[95],"Our":[96,118],"systematic":[97],"evaluation":[98],"of":[99,116,125],"trained":[101],"existing":[103],"datasets":[105],"shown":[107],"their":[108],"shortcomings":[109],"when":[110],"applied":[111],"ToxicChat.":[117],"work":[119],"illuminates":[120],"potentially":[122],"overlooked":[123],"conversations.":[131],"future,":[134],"ToxicChat":[135],"valuable":[139],"resource":[140],"drive":[142],"further":[143],"advancements":[144],"toward":[145],"building":[146],"safe":[148],"and":[149],"healthy":[150],"interactions.":[154]},"counts_by_year":[],"updated_date":"2026-03-10T16:38:18.471706","created_date":"2023-10-28T00:00:00"}
