{"id":"https://openalex.org/W4415937783","doi":"https://doi.org/10.1140/epjds/s13688-026-00647-0","title":"Remembering unequally: global and disciplinary bias in LLM reconstruction of scholarly coauthor lists","display_name":"Remembering unequally: global and disciplinary bias in LLM reconstruction of scholarly coauthor lists","publication_year":2026,"publication_date":"2026-04-20","ids":{"openalex":"https://openalex.org/W4415937783","doi":"https://doi.org/10.1140/epjds/s13688-026-00647-0"},"language":"en","primary_location":{"id":"doi:10.1140/epjds/s13688-026-00647-0","is_oa":true,"landing_page_url":"https://doi.org/10.1140/epjds/s13688-026-00647-0","pdf_url":"https://link.springer.com/content/pdf/10.1140/epjds/s13688-026-00647-0.pdf","source":{"id":"https://openalex.org/S2504380752","display_name":"EPJ Data Science","issn_l":"2193-1127","issn":["2193-1127"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319965","host_organization_name":"Springer Nature","host_organization_lineage":["https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"EPJ Data Science","raw_type":"journal-article"},"type":"article","indexed_in":["arxiv","crossref","datacite","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://link.springer.com/content/pdf/10.1140/epjds/s13688-026-00647-0.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5085285061","display_name":"Ghazal Kalhor","orcid":"https://orcid.org/0000-0002-6153-9048"},"institutions":[{"id":"https://openalex.org/I23946033","display_name":"University of Tehran","ror":"https://ror.org/05vf56z40","country_code":"IR","type":"education","lineage":["https://openalex.org/I23946033"]}],"countries":["IR"],"is_corresponding":true,"raw_author_name":"Ghazal Kalhor","raw_affiliation_strings":["School of Electrical and Computer Engineering, College of Engineering, University of Tehran, Tehran, Iran"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Electrical and Computer Engineering, College of Engineering, University of Tehran, Tehran, Iran","institution_ids":["https://openalex.org/I23946033"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5061449471","display_name":"Afra Mashhadi","orcid":"https://orcid.org/0000-0003-4631-4438"},"institutions":[{"id":"https://openalex.org/I4210138624","display_name":"University of Washington Bothell","ror":"https://ror.org/02ygzhr13","country_code":"US","type":"education","lineage":["https://openalex.org/I201448701","https://openalex.org/I4210138624"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Afra Mashhadi","raw_affiliation_strings":["Computing and Software Systems, University of Washington, Bothell, WA, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Computing and Software Systems, University of Washington, Bothell, WA, USA","institution_ids":["https://openalex.org/I4210138624"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5085285061"],"corresponding_institution_ids":["https://openalex.org/I23946033"],"apc_list":{"value":1190,"currency":"GBP","value_usd":1459},"apc_paid":{"value":1190,"currency":"GBP","value_usd":1459},"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.00145761,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"15","issue":"1","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11710","display_name":"Biomedical Text Mining and Ontologies","score":0.09740000218153,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T11710","display_name":"Biomedical Text Mining and Ontologies","score":0.09740000218153,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T11937","display_name":"Research Data Management Practices","score":0.09109999984502792,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13910","display_name":"Computational and Text Analysis Methods","score":0.08500000089406967,"subfield":{"id":"https://openalex.org/subfields/3300","display_name":"General Social Sciences"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/memorization","display_name":"Memorization","score":0.6751999855041504},{"id":"https://openalex.org/keywords/discipline","display_name":"Discipline","score":0.6462000012397766},{"id":"https://openalex.org/keywords/audit","display_name":"Audit","score":0.5907999873161316},{"id":"https://openalex.org/keywords/scholarship","display_name":"Scholarship","score":0.5192999839782715},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.46149998903274536},{"id":"https://openalex.org/keywords/inequality","display_name":"Inequality","score":0.3456000089645386}],"concepts":[{"id":"https://openalex.org/C30038468","wikidata":"https://www.wikidata.org/wiki/Q4354775","display_name":"Memorization","level":2,"score":0.6751999855041504},{"id":"https://openalex.org/C8795937","wikidata":"https://www.wikidata.org/wiki/Q11862829","display_name":"Discipline","level":2,"score":0.6462000012397766},{"id":"https://openalex.org/C199521495","wikidata":"https://www.wikidata.org/wiki/Q181487","display_name":"Audit","level":2,"score":0.5907999873161316},{"id":"https://openalex.org/C2778061430","wikidata":"https://www.wikidata.org/wiki/Q188823","display_name":"Scholarship","level":2,"score":0.5192999839782715},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.46149998903274536},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.44690001010894775},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.38989999890327454},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.36910000443458557},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.36820000410079956},{"id":"https://openalex.org/C39549134","wikidata":"https://www.wikidata.org/wiki/Q133080","display_name":"Public relations","level":1,"score":0.34769999980926514},{"id":"https://openalex.org/C45555294","wikidata":"https://www.wikidata.org/wiki/Q28113351","display_name":"Inequality","level":2,"score":0.3456000089645386},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.3312000036239624},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.3240000009536743},{"id":"https://openalex.org/C55587333","wikidata":"https://www.wikidata.org/wiki/Q1133029","display_name":"Engineering ethics","level":1,"score":0.3125},{"id":"https://openalex.org/C2991991027","wikidata":"https://www.wikidata.org/wiki/Q6007314","display_name":"Implicit bias","level":2,"score":0.28450000286102295},{"id":"https://openalex.org/C23213167","wikidata":"https://www.wikidata.org/wiki/Q2351730","display_name":"Scientific progress","level":2,"score":0.2752000093460083},{"id":"https://openalex.org/C95713431","wikidata":"https://www.wikidata.org/wiki/Q631425","display_name":"Vulnerability (computing)","level":2,"score":0.2567000091075897},{"id":"https://openalex.org/C188147891","wikidata":"https://www.wikidata.org/wiki/Q147638","display_name":"Cognitive science","level":1,"score":0.2533999979496002},{"id":"https://openalex.org/C108827166","wikidata":"https://www.wikidata.org/wiki/Q175975","display_name":"Internet privacy","level":1,"score":0.2524999976158142}],"mesh":[],"locations_count":6,"locations":[{"id":"doi:10.1140/epjds/s13688-026-00647-0","is_oa":true,"landing_page_url":"https://doi.org/10.1140/epjds/s13688-026-00647-0","pdf_url":"https://link.springer.com/content/pdf/10.1140/epjds/s13688-026-00647-0.pdf","source":{"id":"https://openalex.org/S2504380752","display_name":"EPJ Data Science","issn_l":"2193-1127","issn":["2193-1127"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319965","host_organization_name":"Springer Nature","host_organization_lineage":["https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"EPJ Data Science","raw_type":"journal-article"},{"id":"pmh:oai:arXiv.org:2511.00476","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2511.00476","pdf_url":"https://arxiv.org/pdf/2511.00476","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"pmh:oai:arXiv.org:2511.00476","is_oa":true,"landing_page_url":"https://arxiv.org/abs/2511.00476","pdf_url":"https://arxiv.org/pdf/2511.00476","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"pmh:doi:10.48550/arxiv.2511.00476","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"pmh:oai:doaj.org/article:472a1e906517432a92b25b36e7ec8c12","is_oa":true,"landing_page_url":"https://doaj.org/article/472a1e906517432a92b25b36e7ec8c12","pdf_url":null,"source":{"id":"https://openalex.org/S4306401280","display_name":"DOAJ (DOAJ: Directory of Open Access Journals)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"EPJ Data Science, Vol 15, Iss 1 (2026)","raw_type":"article"},{"id":"doi:10.48550/arxiv.2511.00476","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2511.00476","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.1140/epjds/s13688-026-00647-0","is_oa":true,"landing_page_url":"https://doi.org/10.1140/epjds/s13688-026-00647-0","pdf_url":"https://link.springer.com/content/pdf/10.1140/epjds/s13688-026-00647-0.pdf","source":{"id":"https://openalex.org/S2504380752","display_name":"EPJ Data Science","issn_l":"2193-1127","issn":["2193-1127"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319965","host_organization_name":"Springer Nature","host_organization_lineage":["https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"EPJ Data Science","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4415937783.pdf","grobid_xml":"https://content.openalex.org/works/W4415937783.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Abstract":[0],"Ongoing":[1],"breakthroughs":[2],"in":[3,35,75,174,188],"large":[4],"language":[5],"models":[6],"(LLMs)":[7],"are":[8,43],"reshaping":[9],"scholarly":[10,59,175],"search":[11],"and":[12,31,51,83,93,105,148,166,178],"discovery":[13,176],"interfaces.":[14],"While":[15],"these":[16],"systems":[17],"offer":[18],"new":[19],"possibilities":[20],"for":[21,123,182],"navigating":[22],"scientific":[23],"knowledge,":[24],"they":[25],"also":[26],"raise":[27],"concerns":[28],"about":[29,49],"fairness":[30],"representational":[32],"bias":[33],"rooted":[34],"the":[36,78,164,180],"models\u2019":[37],"memorized":[38],"training":[39],"data.":[40,116],"As":[41],"LLMs":[42,76],"increasingly":[44],"used":[45],"to":[46,56],"answer":[47],"queries":[48],"researchers":[50],"research":[52],"communities,":[53],"their":[54,109],"ability":[55],"accurately":[57],"reconstruct":[58],"coauthor":[60,81,111],"lists":[61,82,112],"becomes":[62],"an":[63],"important":[64],"but":[65],"underexamined":[66],"issue.":[67],"In":[68],"this":[69,85,137],"study,":[70],"we":[71],"investigate":[72],"how":[73],"memorization":[74,130],"affects":[77],"reconstruction":[79,158],"of":[80,153,168,185],"whether":[84],"process":[86],"reflects":[87],"existing":[88],"inequalities":[89],"across":[90],"academic":[91],"disciplines":[92],"world":[94],"regions.":[95],"We":[96],"evaluate":[97],"three":[98],"prominent":[99],"models\u2014DeepSeek":[100],"R1,":[101],"Llama":[102],"4":[103],"Scout,":[104],"Mixtral":[106],"8\u00d77B\u2014by":[107],"comparing":[108],"generated":[110],"against":[113],"bibliographic":[114],"reference":[115],"Our":[117],"analysis":[118],"reveals":[119],"a":[120],"systematic":[121],"advantage":[122],"highly":[124],"cited":[125],"researchers,":[126],"indicating":[127],"that":[128],"LLM":[129],"disproportionately":[131],"favors":[132],"already":[133],"visible":[134],"scholars.":[135],"However,":[136],"pattern":[138],"is":[139],"not":[140],"uniform:":[141],"certain":[142],"disciplines,":[143],"such":[144],"as":[145],"Clinical":[146],"Medicine,":[147],"some":[149],"regions,":[150],"including":[151],"parts":[152],"Africa,":[154],"exhibit":[155],"more":[156],"balanced":[157],"outcomes.":[159],"These":[160],"findings":[161],"highlight":[162],"both":[163],"risks":[165],"limitations":[167],"relying":[169],"on":[170],"LLM-generated":[171],"relational":[172],"knowledge":[173],"contexts":[177],"emphasize":[179],"need":[181],"careful":[183],"auditing":[184],"memorization-driven":[186],"biases":[187],"LLM-based":[189],"systems.":[190]},"counts_by_year":[],"updated_date":"2026-05-13T08:25:38.343686","created_date":"2025-11-05T00:00:00"}
