{"id":"https://openalex.org/W7127127044","doi":"https://doi.org/10.48550/arxiv.2601.22977","title":"Quantifying Model Uniqueness in Heterogeneous AI Ecosystems","display_name":"Quantifying Model Uniqueness in Heterogeneous AI Ecosystems","publication_year":2026,"publication_date":"2026-01-30","ids":{"openalex":"https://openalex.org/W7127127044","doi":"https://doi.org/10.48550/arxiv.2601.22977"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2601.22977","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100401826","display_name":"Lei You","orcid":"https://orcid.org/0000-0002-2697-5776"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"You, Lei","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5100401826"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.19660000503063202,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.19660000503063202,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.11129999905824661,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11986","display_name":"Scientific Computing and Data Management","score":0.050200000405311584,"subfield":{"id":"https://openalex.org/subfields/1802","display_name":"Information Systems and Management"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/uniqueness","display_name":"Uniqueness","score":0.532800018787384},{"id":"https://openalex.org/keywords/redundancy","display_name":"Redundancy (engineering)","score":0.4068000018596649},{"id":"https://openalex.org/keywords/novelty","display_name":"Novelty","score":0.376800000667572},{"id":"https://openalex.org/keywords/probabilistic-logic","display_name":"Probabilistic logic","score":0.36970001459121704},{"id":"https://openalex.org/keywords/a-priori-and-a-posteriori","display_name":"A priori and a posteriori","score":0.365200012922287},{"id":"https://openalex.org/keywords/component","display_name":"Component (thermodynamics)","score":0.359499990940094},{"id":"https://openalex.org/keywords/bayesian-probability","display_name":"Bayesian probability","score":0.34040001034736633}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5623000264167786},{"id":"https://openalex.org/C2777021972","wikidata":"https://www.wikidata.org/wiki/Q22976830","display_name":"Uniqueness","level":2,"score":0.532800018787384},{"id":"https://openalex.org/C152124472","wikidata":"https://www.wikidata.org/wiki/Q1204361","display_name":"Redundancy (engineering)","level":2,"score":0.4068000018596649},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.3871000111103058},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3824999928474426},{"id":"https://openalex.org/C2778738651","wikidata":"https://www.wikidata.org/wiki/Q16546687","display_name":"Novelty","level":2,"score":0.376800000667572},{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.36970001459121704},{"id":"https://openalex.org/C75553542","wikidata":"https://www.wikidata.org/wiki/Q178161","display_name":"A priori and a posteriori","level":2,"score":0.365200012922287},{"id":"https://openalex.org/C168167062","wikidata":"https://www.wikidata.org/wiki/Q1117970","display_name":"Component (thermodynamics)","level":2,"score":0.359499990940094},{"id":"https://openalex.org/C107673813","wikidata":"https://www.wikidata.org/wiki/Q812534","display_name":"Bayesian probability","level":2,"score":0.34040001034736633},{"id":"https://openalex.org/C199521495","wikidata":"https://www.wikidata.org/wiki/Q181487","display_name":"Audit","level":2,"score":0.3301999866962433},{"id":"https://openalex.org/C2778355321","wikidata":"https://www.wikidata.org/wiki/Q17079427","display_name":"Identity (music)","level":2,"score":0.3212999999523163},{"id":"https://openalex.org/C185429906","wikidata":"https://www.wikidata.org/wiki/Q1130160","display_name":"Estimator","level":2,"score":0.31310001015663147},{"id":"https://openalex.org/C155512373","wikidata":"https://www.wikidata.org/wiki/Q287450","display_name":"Residual","level":2,"score":0.305400013923645},{"id":"https://openalex.org/C79772020","wikidata":"https://www.wikidata.org/wiki/Q5159264","display_name":"Conditional independence","level":2,"score":0.29159998893737793},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.29120001196861267},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.28700000047683716},{"id":"https://openalex.org/C114289077","wikidata":"https://www.wikidata.org/wiki/Q3284399","display_name":"Statistical model","level":2,"score":0.2791999876499176},{"id":"https://openalex.org/C149782125","wikidata":"https://www.wikidata.org/wiki/Q160039","display_name":"Econometrics","level":1,"score":0.2612000107765198},{"id":"https://openalex.org/C2780233690","wikidata":"https://www.wikidata.org/wiki/Q535347","display_name":"Transparency (behavior)","level":2,"score":0.251800000667572}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2601.22977","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2601.22977","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.22977","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2601.22977","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/15","display_name":"Life in Land","score":0.559382975101471}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"As":[0],"AI":[1,190],"systems":[2],"evolve":[3],"from":[4,21],"isolated":[5],"predictors":[6],"into":[7],"complex,":[8],"heterogeneous":[9,205],"ecosystems":[10],"of":[11,67,78,97,110,201],"foundation":[12],"models":[13,176,180],"and":[14,56,167,182,203],"specialized":[15],"adapters,":[16],"distinguishing":[17],"genuine":[18],"behavioral":[19],"novelty":[20],"functional":[22],"redundancy":[23],"becomes":[24,90],"a":[25,32,68,87,107,123,197],"critical":[26],"governance":[27],"challenge.":[28],"Here,":[29],"we":[30,51,105,121,141],"introduce":[31],"statistical":[33],"framework":[34,159],"for":[35,126],"auditing":[36,99,202],"model":[37,54,206],"uniqueness":[38,58,113],"based":[39],"on":[40],"In-Silico":[41],"Quasi-Experimental":[42],"Design":[43],"(ISQED).":[44],"By":[45],"enforcing":[46],"matched":[47],"interventions":[48],"across":[49,170],"models,":[50],"isolate":[52],"intrinsic":[53],"identity":[55],"quantify":[57],"as":[59,148],"the":[60,65,94,161],"Peer-Inexpressible":[61],"Residual":[62],"(PIER),":[63],"i.e.":[64],"component":[66],"target's":[69],"behavior":[70],"strictly":[71],"irreducible":[72],"to":[73,153],"any":[74],"stochastic":[75],"convex":[76],"combination":[77],"its":[79],"peers,":[80],"with":[81],"vanishing":[82],"PIER":[83],"characterizing":[84],"when":[85],"such":[86,147],"routing-based":[88],"substitution":[89],"possible.":[91],"We":[92,156],"establish":[93,196],"theoretical":[95],"foundations":[96],"ecosystem":[98],"through":[100],"three":[101],"key":[102],"contributions.":[103],"First,":[104],"prove":[106],"fundamental":[108],"limitation":[109],"observational":[111],"logs:":[112],"is":[114],"mathematically":[115],"non-identifiable":[116],"without":[117],"intervention":[118],"control.":[119],"Second,":[120],"derive":[122],"scaling":[124],"law":[125],"active":[127],"auditing,":[128],"showing":[129],"that":[130,143],"our":[131],"adaptive":[132],"query":[133],"protocol":[134],"achieves":[135],"minimax-optimal":[136],"sample":[137],"efficiency":[138],"($d\u03c3^2\u03b3^{-2}\\log(Nd/\u03b4)$).":[139],"Third,":[140],"demonstrate":[142],"cooperative":[144],"game-theoretic":[145],"methods,":[146],"Shapley":[149],"values,":[150],"fundamentally":[151],"fail":[152],"detect":[154],"redundancy.":[155],"implement":[157],"this":[158],"via":[160],"DISCO":[162],"(Design-Integrated":[163],"Synthetic":[164],"Control)":[165],"estimator":[166],"deploy":[168],"it":[169],"diverse":[171],"ecosystems,":[172],"including":[173],"computer":[174],"vision":[175],"(ResNet/ConvNeXt/ViT),":[177],"large":[178],"language":[179],"(BERT/RoBERTa),":[181],"city-scale":[183],"traffic":[184],"forecasters.":[185],"These":[186],"results":[187],"move":[188],"trustworthy":[189],"beyond":[191],"explaining":[192],"single":[193],"models:":[194],"they":[195],"principled,":[198],"intervention-based":[199],"science":[200],"governing":[204],"ecosystems.":[207]},"counts_by_year":[],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2026-02-03T00:00:00"}
