{"id":"https://openalex.org/W7140517056","doi":"https://doi.org/10.48550/arxiv.2603.24569","title":"POLY-SIM: Polyglot Speaker Identification with Missing Modality Grand Challenge 2026 Evaluation Plan","display_name":"POLY-SIM: Polyglot Speaker Identification with Missing Modality Grand Challenge 2026 Evaluation Plan","publication_year":2026,"publication_date":"2026-03-25","ids":{"openalex":"https://openalex.org/W7140517056","doi":"https://doi.org/10.48550/arxiv.2603.24569"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.24569","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.24569","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.24569","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5102755522","display_name":"Marta Moscati","orcid":"https://orcid.org/0000-0002-5541-4919"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Moscati, Marta","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101076782","display_name":"Muhammad Saad Saeed","orcid":"https://orcid.org/0000-0002-0893-9499"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Saeed, Muhammad Saad","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5120366257","display_name":"Marina Zanoni","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zanoni, Marina","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020931012","display_name":"Mubashir Noman","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Noman, Mubashir","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5029637694","display_name":"Rohan Kumar Das","orcid":"https://orcid.org/0000-0002-1332-3357"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Das, Rohan Kumar","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5023575441","display_name":"Monorama Swain","orcid":"https://orcid.org/0000-0002-3768-857X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Swain, Monorama","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130659481","display_name":"Yufang Hou","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hou, Yufang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130689106","display_name":"Elisabeth Andre","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Andre, Elisabeth","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024102795","display_name":"Khalid Mahmood Malik","orcid":"https://orcid.org/0000-0002-7927-3436"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Malik, Khalid Mahmood","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5091259315","display_name":"Markus Schedl","orcid":"https://orcid.org/0000-0003-1706-3406"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Schedl, Markus","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5130664596","display_name":"Shah Nawaz","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Nawaz, Shah","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":11,"corresponding_author_ids":["https://openalex.org/A5102755522"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.5597000122070312,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.5597000122070312,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.3529999852180481,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11448","display_name":"Face recognition and analysis","score":0.005799999926239252,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/speaker-identification","display_name":"Speaker identification","score":0.6790000200271606},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.6438999772071838},{"id":"https://openalex.org/keywords/identification","display_name":"Identification (biology)","score":0.6043999791145325},{"id":"https://openalex.org/keywords/modalities","display_name":"Modalities","score":0.5752999782562256},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.5712000131607056},{"id":"https://openalex.org/keywords/speaker-recognition","display_name":"Speaker recognition","score":0.46700000762939453},{"id":"https://openalex.org/keywords/polyglot","display_name":"Polyglot","score":0.4577000141143799},{"id":"https://openalex.org/keywords/modality","display_name":"Modality (human\u2013computer interaction)","score":0.44350001215934753}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7681999802589417},{"id":"https://openalex.org/C2986627078","wikidata":"https://www.wikidata.org/wiki/Q1145189","display_name":"Speaker identification","level":3,"score":0.6790000200271606},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.6438999772071838},{"id":"https://openalex.org/C116834253","wikidata":"https://www.wikidata.org/wiki/Q2039217","display_name":"Identification (biology)","level":2,"score":0.6043999791145325},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5753999948501587},{"id":"https://openalex.org/C2779903281","wikidata":"https://www.wikidata.org/wiki/Q6888026","display_name":"Modalities","level":2,"score":0.5752999782562256},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.5712000131607056},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5031999945640564},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.47369998693466187},{"id":"https://openalex.org/C133892786","wikidata":"https://www.wikidata.org/wiki/Q1145189","display_name":"Speaker recognition","level":2,"score":0.46700000762939453},{"id":"https://openalex.org/C2780239667","wikidata":"https://www.wikidata.org/wiki/Q2102850","display_name":"Polyglot","level":2,"score":0.4577000141143799},{"id":"https://openalex.org/C2780226545","wikidata":"https://www.wikidata.org/wiki/Q6888030","display_name":"Modality (human\u2013computer interaction)","level":2,"score":0.44350001215934753},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.43790000677108765},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.41589999198913574},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.4156999886035919},{"id":"https://openalex.org/C12725497","wikidata":"https://www.wikidata.org/wiki/Q810247","display_name":"Baseline (sea)","level":2,"score":0.37049999833106995},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.33309999108314514},{"id":"https://openalex.org/C9357733","wikidata":"https://www.wikidata.org/wiki/Q6878417","display_name":"Missing data","level":2,"score":0.3310000002384186},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.3276999890804291},{"id":"https://openalex.org/C135641252","wikidata":"https://www.wikidata.org/wiki/Q738567","display_name":"Multimodal interaction","level":2,"score":0.28929999470710754},{"id":"https://openalex.org/C203005215","wikidata":"https://www.wikidata.org/wiki/Q79798","display_name":"Machine translation","level":2,"score":0.2849000096321106},{"id":"https://openalex.org/C2776505523","wikidata":"https://www.wikidata.org/wiki/Q4785468","display_name":"Plan (archaeology)","level":2,"score":0.273499995470047},{"id":"https://openalex.org/C155092808","wikidata":"https://www.wikidata.org/wiki/Q182557","display_name":"Computational linguistics","level":2,"score":0.26919999718666077}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.24569","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.24569","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.24569","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.24569","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Quality Education","score":0.7838742733001709,"id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Multimodal":[0],"speaker":[1,64,78,152],"identification":[2,65,79,153],"systems":[3],"typically":[4],"assume":[5],"the":[6,58,86,90,112,117,123,140],"availability":[7],"of":[8,62,92,116],"complete":[9],"and":[10,17,60,82,114,129,137,149],"homogeneous":[11],"audio-visual":[12],"modalities":[13],"during":[14],"both":[15],"training":[16],"testing.":[18],"However,":[19],"in":[20,76],"real-world":[21],"applications,":[22],"such":[23],"assumptions":[24],"often":[25],"do":[26],"not":[27],"hold.":[28],"Visual":[29],"information":[30],"may":[31],"be":[32],"missing":[33],"due":[34,48],"to":[35,49,73,143],"occlusions,":[36],"camera":[37],"failures,":[38],"or":[39],"privacy":[40],"constraints,":[41],"while":[42,102],"multilingual":[43],"speakers":[44],"introduce":[45],"additional":[46],"complexity":[47],"linguistic":[50],"variability":[51],"across":[52,106],"languages.":[53,108],"These":[54],"challenges":[55],"significantly":[56],"affect":[57],"robustness":[59],"generalization":[61],"multimodal":[63,77,100,151],"systems.":[66,154],"The":[67],"POLY-SIM":[68,118],"Grand":[69,87,119],"Challenge":[70,88,120],"2026":[71],"aims":[72,142],"advance":[74],"research":[75],"under":[80],"missing-modality":[81],"cross-lingual":[83],"conditions.":[84],"Specifically,":[85],"encourages":[89],"development":[91],"robust":[93,148],"methods":[94],"that":[95],"can":[96],"effectively":[97],"leverage":[98],"incomplete":[99],"inputs":[101],"maintaining":[103],"strong":[104],"performance":[105],"different":[107],"This":[109],"report":[110],"presents":[111],"design":[113],"organization":[115],"2026,":[121],"including":[122],"dataset,":[124],"task":[125],"formulation,":[126],"evaluation":[127,138],"protocol,":[128],"baseline":[130],"model.":[131],"By":[132],"providing":[133],"a":[134],"standardized":[135],"benchmark":[136],"framework,":[139],"challenge":[141],"foster":[144],"progress":[145],"toward":[146],"more":[147],"practical":[150]},"counts_by_year":[],"updated_date":"2026-05-04T08:30:34.212998","created_date":"2026-03-27T00:00:00"}
