{"id":"https://openalex.org/W7092292881","doi":"https://doi.org/10.48550/arxiv.2510.13898","title":"Attribution Quality in AI-Generated Content:Benchmarking Style Embeddings and LLM Judges","display_name":"Attribution Quality in AI-Generated Content:Benchmarking Style Embeddings and LLM Judges","publication_year":2025,"publication_date":"2025-10-14","ids":{"openalex":"https://openalex.org/W7092292881","doi":"https://doi.org/10.48550/arxiv.2510.13898"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2510.13898","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2510.13898","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2510.13898","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Abbas, Misam","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Abbas, Misam","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":1,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":true,"primary_topic":{"id":"https://openalex.org/T12380","display_name":"Authorship Attribution and Profiling","score":0.8409000039100647,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12380","display_name":"Authorship Attribution and Profiling","score":0.8409000039100647,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11636","display_name":"Artificial Intelligence in Healthcare and Education","score":0.03480000048875809,"subfield":{"id":"https://openalex.org/subfields/2718","display_name":"Health Informatics"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.0340999998152256,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/attribution","display_name":"Attribution","score":0.7843000292778015},{"id":"https://openalex.org/keywords/continuation","display_name":"Continuation","score":0.7706000208854675},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.7556999921798706},{"id":"https://openalex.org/keywords/style","display_name":"Style (visual arts)","score":0.7093999981880188},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.6011999845504761},{"id":"https://openalex.org/keywords/baseline","display_name":"Baseline (sea)","score":0.5795000195503235},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.579200029373169},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.5758000016212463}],"concepts":[{"id":"https://openalex.org/C143299363","wikidata":"https://www.wikidata.org/wiki/Q900584","display_name":"Attribution","level":2,"score":0.7843000292778015},{"id":"https://openalex.org/C88626702","wikidata":"https://www.wikidata.org/wiki/Q1128903","display_name":"Continuation","level":2,"score":0.7706000208854675},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.7556999921798706},{"id":"https://openalex.org/C2776445246","wikidata":"https://www.wikidata.org/wiki/Q1792644","display_name":"Style (visual arts)","level":2,"score":0.7093999981880188},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6284000277519226},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.6011999845504761},{"id":"https://openalex.org/C12725497","wikidata":"https://www.wikidata.org/wiki/Q810247","display_name":"Baseline (sea)","level":2,"score":0.5795000195503235},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.579200029373169},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.5758000016212463},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5340999960899353},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5105000138282776},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.4602000117301941},{"id":"https://openalex.org/C2779304628","wikidata":"https://www.wikidata.org/wiki/Q3503480","display_name":"Face (sociological concept)","level":2,"score":0.45660001039505005},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.38260000944137573},{"id":"https://openalex.org/C180747234","wikidata":"https://www.wikidata.org/wiki/Q23373","display_name":"Cognitive psychology","level":1,"score":0.33399999141693115},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.3183000087738037},{"id":"https://openalex.org/C3020202489","wikidata":"https://www.wikidata.org/wiki/Q2032038","display_name":"Authorship attribution","level":2,"score":0.31679999828338623},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.298799991607666},{"id":"https://openalex.org/C2780876879","wikidata":"https://www.wikidata.org/wiki/Q3054749","display_name":"Meaning (existential)","level":2,"score":0.28700000047683716},{"id":"https://openalex.org/C2776230583","wikidata":"https://www.wikidata.org/wiki/Q1322198","display_name":"Spoken language","level":2,"score":0.2867000102996826},{"id":"https://openalex.org/C4679612","wikidata":"https://www.wikidata.org/wiki/Q866298","display_name":"Aggregate (composite)","level":2,"score":0.2842000126838684},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.2816999852657318},{"id":"https://openalex.org/C136197465","wikidata":"https://www.wikidata.org/wiki/Q1729295","display_name":"Variety (cybernetics)","level":2,"score":0.2809999883174896},{"id":"https://openalex.org/C189950617","wikidata":"https://www.wikidata.org/wiki/Q937228","display_name":"Property (philosophy)","level":2,"score":0.2736999988555908},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.2685000002384186}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2510.13898","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2510.13898","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2510.13898","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2510.13898","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.8858913779258728}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Attributing":[0],"authorship":[1],"in":[2,127,138,187],"the":[3,36,103,115,122,173],"era":[4],"of":[5,44,194],"large":[6],"language":[7],"models":[8],"(LLMs)":[9],"is":[10,99],"increasingly":[11],"challenging":[12],"as":[13,151],"machine-generated":[14],"prose":[15],"rivals":[16],"human":[17,64],"writing.":[18],"We":[19],"benchmark":[20,182],"two":[21],"complementary":[22,147],"attribution":[23,150,184],"mechanisms":[24],",":[25],"fixed":[26],"Style":[27,81,104],"Embeddings":[28],"and":[29,57,71,129,140,166],"an":[30,41,72],"instruction-tuned":[31],"LLM":[32,97,123],"judge":[33,124],"(GPT-4o)":[34],"on":[35,88,106,164,169],"Human":[37],"AI":[38],"Parallel":[39],"Corpus,":[40],"open":[42,177],"dataset":[43],"600":[45],"balanced":[46],"instances":[47],"spanning":[48],"six":[49],"domains":[50],"(academic,":[51],"news,":[52],"fiction,":[53],"blogs,":[54],"spoken":[55,139],"transcripts,":[56],"TV/movie":[58],"scripts).":[59],"Each":[60],"instance":[61],"contains":[62],"a":[63,68,152,180,192],"prompt":[65],"with":[66,191],"both":[67],"gold":[69],"continuation":[70,74],"LLM-generated":[73],"from":[75],"either":[76],"GPT-4o":[77],"or":[78],"LLaMA-70B-Instruct.":[79],"The":[80,96],"Embedding":[82],"baseline":[83],"achieves":[84],"stronger":[85],"aggregate":[86],"accuracy":[87],"GPT":[89],"continuations":[90,108],"(82":[91],"pct":[92,110],"vs.":[93,111],"68":[94],"pct).":[95],"Judge":[98],"slightly":[100],"better":[101],"than":[102],"embeddings":[105,136],"LLaMA":[107],"(85":[109],"81":[112],"pct)":[113],"but":[114],"results":[116],"are":[117],"not":[118],"statistically":[119],"significant.":[120],"Crucially,":[121],"significantly":[125],"outperforms":[126],"fiction":[128],"academic":[130],"prose,":[131],"indicating":[132],"semantic":[133],"sensitivity,":[134],"whereas":[135],"dominate":[137],"scripted":[141],"dialogue,":[142],"reflecting":[143],"structural":[144],"strengths.":[145],"These":[146],"patterns":[148],"highlight":[149],"multidimensional":[153],"problem":[154],"requiring":[155],"hybrid":[156],"strategies.":[157],"To":[158],"support":[159],"reproducibility":[160],"we":[161],"provide":[162],"code":[163],"GitHub":[165],"derived":[167],"data":[168],"Hugging":[170],"Face":[171],"under":[172],"MIT":[174],"license.":[175],"This":[176],"framework":[178],"provides":[179],"reproducible":[181],"for":[183],"quality":[185],"assessment":[186],"AI-generated":[188],"content,":[189],"along":[190],"review":[193],"related":[195],"literature":[196],"influencing":[197],"this":[198],"work.":[199]},"counts_by_year":[],"updated_date":"2025-11-06T06:51:31.235846","created_date":"2025-10-18T00:00:00"}
