{"id":"https://openalex.org/W7101448010","doi":"https://doi.org/10.48550/arxiv.2510.21204","title":"Mitra: Mixed Synthetic Priors for Enhancing Tabular Foundation Models","display_name":"Mitra: Mixed Synthetic Priors for Enhancing Tabular Foundation Models","publication_year":2025,"publication_date":"2025-10-24","ids":{"openalex":"https://openalex.org/W7101448010","doi":"https://doi.org/10.48550/arxiv.2510.21204"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2510.21204","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2510.21204","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2510.21204","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Zhang, Xiyuan","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Zhang, Xiyuan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Maddix, Danielle C.","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Maddix, Danielle C.","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Yin, Junming","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yin, Junming","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Erickson, Nick","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Erickson, Nick","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Ansari, Abdul Fatir","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ansari, Abdul Fatir","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Han, Boran","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Han, Boran","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Zhang, Shuai","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Shuai","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Akoglu, Leman","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Akoglu, Leman","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Faloutsos, Christos","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Faloutsos, Christos","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Mahoney, Michael W.","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mahoney, Michael W.","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Hu, Cuixiong","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hu, Cuixiong","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Rangwala, Huzefa","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Rangwala, Huzefa","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Karypis, George","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Karypis, George","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":null,"display_name":"Wang, Bernie","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Bernie","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":14,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":true,"primary_topic":{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.179299995303154,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.179299995303154,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.16949999332427979,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.10540000349283218,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/prior-probability","display_name":"Prior probability","score":0.8422999978065491},{"id":"https://openalex.org/keywords/foundation","display_name":"Foundation (evidence)","score":0.5515999794006348},{"id":"https://openalex.org/keywords/synthetic-data","display_name":"Synthetic data","score":0.4893999993801117},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.42739999294281006},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.399399995803833},{"id":"https://openalex.org/keywords/training-set","display_name":"Training set","score":0.36629998683929443}],"concepts":[{"id":"https://openalex.org/C177769412","wikidata":"https://www.wikidata.org/wiki/Q278090","display_name":"Prior probability","level":3,"score":0.8422999978065491},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6877999901771545},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6732000112533569},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.6353999972343445},{"id":"https://openalex.org/C2780966255","wikidata":"https://www.wikidata.org/wiki/Q5474306","display_name":"Foundation (evidence)","level":2,"score":0.5515999794006348},{"id":"https://openalex.org/C160920958","wikidata":"https://www.wikidata.org/wiki/Q7662746","display_name":"Synthetic data","level":2,"score":0.4893999993801117},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.42739999294281006},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.399399995803833},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.36629998683929443},{"id":"https://openalex.org/C198531522","wikidata":"https://www.wikidata.org/wiki/Q485146","display_name":"Sample (material)","level":2,"score":0.3562000095844269},{"id":"https://openalex.org/C83546350","wikidata":"https://www.wikidata.org/wiki/Q1139051","display_name":"Regression","level":2,"score":0.3434999883174896},{"id":"https://openalex.org/C152877465","wikidata":"https://www.wikidata.org/wiki/Q208042","display_name":"Regression analysis","level":2,"score":0.2531999945640564},{"id":"https://openalex.org/C61224824","wikidata":"https://www.wikidata.org/wiki/Q2260434","display_name":"Mixture model","level":2,"score":0.2500999867916107}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2510.21204","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2510.21204","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2510.21204","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2510.21204","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Since":[0],"the":[1,52,63,72,79,91,96],"seminal":[2],"work":[3,89],"of":[4,47,65,105,129],"TabPFN,":[5],"research":[6],"on":[7,13,31,116,125,139],"tabular":[8,55,141],"foundation":[9],"models":[10,29],"(TFMs)":[11],"based":[12],"in-context":[14,48],"learning":[15,57],"(ICL)":[16],"has":[17],"challenged":[18],"long-standing":[19],"paradigms":[20],"in":[21,54],"machine":[22,56],"learning.":[23],"Without":[24],"seeing":[25],"any":[26],"real-world":[27,140],"data,":[28],"pretrained":[30,110],"purely":[32],"synthetic":[33,66,106,130],"datasets":[34],"generalize":[35,113],"remarkably":[36],"well":[37],"across":[38,153],"diverse":[39],"datasets,":[40,67],"often":[41],"using":[42],"only":[43],"a":[44,122,126],"moderate":[45],"number":[46],"examples.":[49],"This":[50,88],"shifts":[51],"focus":[53],"from":[58],"model":[59],"architecture":[60],"design":[61,64,84],"to":[62,71,94,112],"or,":[68],"more":[69],"precisely,":[70],"prior":[73,83],"distributions":[74],"that":[75,108],"generate":[76],"them.":[77],"Yet":[78],"guiding":[80],"principles":[81],"for":[82,133],"remain":[85],"poorly":[86],"understood.":[87],"marks":[90],"first":[92],"attempt":[93],"address":[95],"gap.":[97],"We":[98],"systematically":[99],"investigate":[100],"and":[101,137,151,156],"identify":[102],"key":[103],"properties":[104],"priors":[107,131],"allow":[109],"TFMs":[111],"well.":[114],"Based":[115],"these":[117],"insights,":[118],"we":[119],"introduce":[120],"Mitra,":[121],"TFM":[123],"trained":[124],"curated":[127],"mixture":[128],"selected":[132],"their":[134],"diversity,":[135],"distinctiveness,":[136],"performance":[138],"data.":[142],"Mitra":[143],"consistently":[144],"outperforms":[145],"state-of-the-art":[146],"TFMs,":[147],"such":[148],"as":[149],"TabPFNv2":[150],"TabICL,":[152],"both":[154],"classification":[155],"regression":[157],"benchmarks,":[158],"with":[159],"better":[160],"sample":[161],"efficiency.":[162]},"counts_by_year":[],"updated_date":"2025-11-06T06:51:31.235846","created_date":"2025-10-28T00:00:00"}
