{"id":"https://openalex.org/W4283208995","doi":"https://doi.org/10.1109/infocomwkshps54753.2022.9798377","title":"REGRETS: A New Corpus of Regrettable (Self-)Disclosures on Social Media","display_name":"REGRETS: A New Corpus of Regrettable (Self-)Disclosures on Social Media","publication_year":2022,"publication_date":"2022-05-02","ids":{"openalex":"https://openalex.org/W4283208995","doi":"https://doi.org/10.1109/infocomwkshps54753.2022.9798377"},"language":"en","primary_location":{"id":"doi:10.1109/infocomwkshps54753.2022.9798377","is_oa":false,"landing_page_url":"https://doi.org/10.1109/infocomwkshps54753.2022.9798377","pdf_url":null,"source":{"id":"https://openalex.org/S4363607985","display_name":"IEEE INFOCOM 2022 - IEEE Conference on Computer Communications Workshops (INFOCOM WKSHPS)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE INFOCOM 2022 - IEEE Conference on Computer Communications Workshops (INFOCOM WKSHPS)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5069006785","display_name":"Hervais Simo","orcid":null},"institutions":[{"id":"https://openalex.org/I4210133470","display_name":"Fraunhofer Institute for Secure Information Technology","ror":"https://ror.org/03qt2gs44","country_code":"DE","type":"facility","lineage":["https://openalex.org/I4210133470","https://openalex.org/I4923324"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Hervais Simo","raw_affiliation_strings":["Fraunhofer SIT,Darmstadt,Germany","Fraunhofer SIT, Darmstadt, Germany"],"affiliations":[{"raw_affiliation_string":"Fraunhofer SIT,Darmstadt,Germany","institution_ids":["https://openalex.org/I4210133470"]},{"raw_affiliation_string":"Fraunhofer SIT, Darmstadt, Germany","institution_ids":["https://openalex.org/I4210133470"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5027434434","display_name":"Michael Kreutzer","orcid":"https://orcid.org/0000-0003-0748-7707"},"institutions":[{"id":"https://openalex.org/I4210133470","display_name":"Fraunhofer Institute for Secure Information Technology","ror":"https://ror.org/03qt2gs44","country_code":"DE","type":"facility","lineage":["https://openalex.org/I4210133470","https://openalex.org/I4923324"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Michael Kreutzer","raw_affiliation_strings":["Fraunhofer SIT,Darmstadt,Germany","Fraunhofer SIT, Darmstadt, Germany"],"affiliations":[{"raw_affiliation_string":"Fraunhofer SIT,Darmstadt,Germany","institution_ids":["https://openalex.org/I4210133470"]},{"raw_affiliation_string":"Fraunhofer SIT, Darmstadt, Germany","institution_ids":["https://openalex.org/I4210133470"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5069006785"],"corresponding_institution_ids":["https://openalex.org/I4210133470"],"apc_list":null,"apc_paid":null,"fwci":0.3116,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.48486318,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"2"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12262","display_name":"Hate Speech and Cyberbullying Detection","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12262","display_name":"Hate Speech and Cyberbullying Detection","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11147","display_name":"Misinformation and Its Impacts","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/3312","display_name":"Sociology and Political Science"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11644","display_name":"Spam and Phishing Detection","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7408468723297119},{"id":"https://openalex.org/keywords/social-media","display_name":"Social media","score":0.7045501470565796},{"id":"https://openalex.org/keywords/regret","display_name":"Regret","score":0.7026709318161011},{"id":"https://openalex.org/keywords/offensive","display_name":"Offensive","score":0.5873466730117798},{"id":"https://openalex.org/keywords/annotation","display_name":"Annotation","score":0.5313591957092285},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.4813114404678345},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.4221181869506836},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4216192960739136},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.36251333355903625},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.35519281029701233},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.32866325974464417},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.22029805183410645}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7408468723297119},{"id":"https://openalex.org/C518677369","wikidata":"https://www.wikidata.org/wiki/Q202833","display_name":"Social media","level":2,"score":0.7045501470565796},{"id":"https://openalex.org/C50817715","wikidata":"https://www.wikidata.org/wiki/Q79895177","display_name":"Regret","level":2,"score":0.7026709318161011},{"id":"https://openalex.org/C176856949","wikidata":"https://www.wikidata.org/wiki/Q2001676","display_name":"Offensive","level":2,"score":0.5873466730117798},{"id":"https://openalex.org/C2776321320","wikidata":"https://www.wikidata.org/wiki/Q857525","display_name":"Annotation","level":2,"score":0.5313591957092285},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.4813114404678345},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.4221181869506836},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4216192960739136},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.36251333355903625},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.35519281029701233},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.32866325974464417},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.22029805183410645},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/infocomwkshps54753.2022.9798377","is_oa":false,"landing_page_url":"https://doi.org/10.1109/infocomwkshps54753.2022.9798377","pdf_url":null,"source":{"id":"https://openalex.org/S4363607985","display_name":"IEEE INFOCOM 2022 - IEEE Conference on Computer Communications Workshops (INFOCOM WKSHPS)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE INFOCOM 2022 - IEEE Conference on Computer Communications Workshops (INFOCOM WKSHPS)","raw_type":"proceedings-article"},{"id":"pmh:oai:publica.fraunhofer.de:publica/418790","is_oa":false,"landing_page_url":"https://publica.fraunhofer.de/handle/publica/418790","pdf_url":null,"source":{"id":"https://openalex.org/S4306400318","display_name":"Fraunhofer-Publica (Fraunhofer-Gesellschaft)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4923324","host_organization_name":"Fraunhofer-Gesellschaft","host_organization_lineage":["https://openalex.org/I4923324"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"conference paper"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","score":0.6000000238418579,"display_name":"Peace, Justice and strong institutions"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320311687","display_name":"Ministry of Education","ror":"https://ror.org/03m01yf64"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":6,"referenced_works":["https://openalex.org/W1614298861","https://openalex.org/W1993722065","https://openalex.org/W2101210369","https://openalex.org/W2343252634","https://openalex.org/W6636510571","https://openalex.org/W6704698082"],"related_works":["https://openalex.org/W2748952813","https://openalex.org/W2971351794","https://openalex.org/W4376155396","https://openalex.org/W1568520348","https://openalex.org/W3214407891","https://openalex.org/W1947085858","https://openalex.org/W3194113117","https://openalex.org/W4287020359","https://openalex.org/W3213194066","https://openalex.org/W268355439"],"abstract_inverted_index":{"In":[0,47],"the":[1,34,51,75,111,113,166,239,244,251,254],"past":[2],"few":[3],"years,":[4],"researchers":[5],"have":[6],"shown":[7],"a":[8,43,49,60,180,193],"growing":[9,66],"interest":[10],"in":[11,128,134],"techniques":[12],"for":[13,168,172,183],"automated":[14,173],"detection":[15,174],"of":[16,30,36,77,80,115,149,158,175,197,218,241,246,253],"regrettable":[17,40,81,94,200],"disclosures":[18,41],"(things":[19],"people":[20],"wish":[21],"they":[22],"had":[23],"not":[24],"shared)":[25],"on":[26,59,86,110,215,235],"social":[27,87,142,220,229,247],"media.":[28,88],"Most":[29],"these":[31],"proposals":[32],"formulate":[33],"task":[35],"automatically":[37],"detecting":[38],"potentially":[39],"as":[42,100,154,261],"supervised":[44],"classification":[45,53],"problem.":[46],"such":[48,99],"setting,":[50],"underlying":[52],"model":[54],"is":[55,161],"trained":[56],"and":[57,83,104,117,136,145,187,203,250],"validate":[58],"dataset":[61],"labeled":[62],"accordingly.":[63],"However,":[64],"despite":[65],"efforts,":[67],"existing":[68],"approaches":[69],"remain":[70],"limited,":[71],"partly":[72,242],"due":[73],"to":[74,92,123,162,263],"lack":[76],"high-quality":[78,206],"corpus":[79,196,217],"messages":[82],"comments":[84,204],"shared":[85],"Previous":[89],"work":[90,130],"tend":[91],"confuse":[93],"disclosure":[95,118],"with":[96,205],"related":[97],"concepts":[98],"hate":[101],"speech,":[102],"profanity":[103],"offensive":[105],"language,":[106],"ignoring":[107],"empirical":[108],"findings":[109,260],"reasons,":[112],"types":[114],"contents,":[116],"contexts":[119],"that":[120,237],"often":[121],"lead":[122],"regrets.":[124],"Moreover,":[125],"corpora":[126],"used":[127,153],"prior":[129],"are":[131],"typically":[132],"limited":[133],"size":[135],"w.r.t.":[137],"their":[138],"source":[139],"domains":[140],"(i.e.,":[141,147],"media":[143,221,230,248],"platforms)":[144],"scope":[146],"range":[148],"regret-related":[150,176],"topical":[151],"content":[152],"labels).":[155],"The":[156],"goal":[157],"this":[159],"paper":[160],"contribute":[163],"towards":[164],"lowering":[165],"barrier":[167],"developing":[169],"effective":[170],"systems":[171],"posts.":[177],"We":[178,190,257],"propose":[179,210],"novel":[181],"methodology":[182],"large-scale":[184,195],"data":[185],"collection":[186],"semi-automated":[188],"annotation.":[189],"introduce":[191],"REGRETS,":[192],"new":[194],"4,7":[198],"million":[199],"text-only":[201],"posts":[202],"annotations.":[207],"Further,":[208],"we":[209,233],"regret-specific":[211],"embeddings":[212],"models":[213],"pre-trained":[214],"our":[216,259],"user-generated":[219],"texts":[222],"which":[223],"were":[224],"extracted":[225],"from":[226],"various":[227],"popular":[228],"ecosystems.":[231],"Lastly,":[232],"report":[234],"analyses":[236],"demonstrate":[238],"feasibility":[240],"automating":[243],"annotation":[245],"texts,":[249],"richness":[252],"resulting":[255],"corpus.":[256],"release":[258],"resources":[262],"facilitate":[264],"further":[265],"interdisciplinary":[266],"research:":[267],"https://bit.ly/3fO36Ex.":[268]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2022,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
