{"id":"https://openalex.org/W7140129268","doi":"https://doi.org/10.48550/arxiv.2603.20191","title":"Deterministic Mode Proposals: An Efficient Alternative to Generative Sampling for Ambiguous Segmentation","display_name":"Deterministic Mode Proposals: An Efficient Alternative to Generative Sampling for Ambiguous Segmentation","publication_year":2026,"publication_date":"2026-03-20","ids":{"openalex":"https://openalex.org/W7140129268","doi":"https://doi.org/10.48550/arxiv.2603.20191"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.20191","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.20191","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.20191","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5130374030","display_name":"Sebastian Gerard","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gerard, Sebastian","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5088465676","display_name":"Josephine Sullivan","orcid":"https://orcid.org/0000-0003-2784-7300"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sullivan, Josephine","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.7145000100135803,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.7145000100135803,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.07569999992847443,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.05609999969601631,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.7222999930381775},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.6444000005722046},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.5879999995231628},{"id":"https://openalex.org/keywords/image-segmentation","display_name":"Image segmentation","score":0.5051000118255615},{"id":"https://openalex.org/keywords/sampling","display_name":"Sampling (signal processing)","score":0.4975000023841858},{"id":"https://openalex.org/keywords/mode","display_name":"Mode (computer interface)","score":0.48579999804496765},{"id":"https://openalex.org/keywords/generative-model","display_name":"Generative model","score":0.45660001039505005},{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.4521999955177307},{"id":"https://openalex.org/keywords/scale-space-segmentation","display_name":"Scale-space segmentation","score":0.43290001153945923}],"concepts":[{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.7222999930381775},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.6444000005722046},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.637499988079071},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.5879999995231628},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5390999913215637},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.5051000118255615},{"id":"https://openalex.org/C140779682","wikidata":"https://www.wikidata.org/wiki/Q210868","display_name":"Sampling (signal processing)","level":3,"score":0.4975000023841858},{"id":"https://openalex.org/C48677424","wikidata":"https://www.wikidata.org/wiki/Q6888088","display_name":"Mode (computer interface)","level":2,"score":0.48579999804496765},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.45660001039505005},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.4521999955177307},{"id":"https://openalex.org/C65885262","wikidata":"https://www.wikidata.org/wiki/Q7429708","display_name":"Scale-space segmentation","level":4,"score":0.43290001153945923},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.4244000017642975},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.42399999499320984},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4162999987602234},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.38839998841285706},{"id":"https://openalex.org/C177769412","wikidata":"https://www.wikidata.org/wiki/Q278090","display_name":"Prior probability","level":3,"score":0.3878999948501587},{"id":"https://openalex.org/C25694479","wikidata":"https://www.wikidata.org/wiki/Q7446278","display_name":"Segmentation-based object categorization","level":5,"score":0.38530001044273376},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.37869998812675476},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.3303000032901764},{"id":"https://openalex.org/C149441793","wikidata":"https://www.wikidata.org/wiki/Q200726","display_name":"Probability distribution","level":2,"score":0.29030001163482666},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.2872999906539917},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.28380000591278076},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.27790001034736633},{"id":"https://openalex.org/C9417928","wikidata":"https://www.wikidata.org/wiki/Q1070689","display_name":"Image processing","level":3,"score":0.25760000944137573},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.2574000060558319},{"id":"https://openalex.org/C167723999","wikidata":"https://www.wikidata.org/wiki/Q3773214","display_name":"Sampling distribution","level":2,"score":0.257099986076355},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.25279998779296875}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.20191","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.20191","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"Preprint"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.20191","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.20191","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Many":[0],"segmentation":[1,7,113],"tasks,":[2],"such":[3],"as":[4],"medical":[5],"image":[6],"or":[8],"future":[9],"state":[10],"prediction,":[11],"are":[12,19],"inherently":[13],"ambiguous,":[14],"meaning":[15],"that":[16,80,133,155],"multiple":[17],"predictions":[18],"equally":[20],"correct.":[21],"Current":[22],"methods":[23,43],"typically":[24],"rely":[25],"on":[26],"generative":[27,128],"models":[28],"to":[29,65,108,149],"capture":[30],"this":[31,56],"uncertainty.":[32],"However,":[33],"identifying":[34],"the":[35,39,60,66,109,141,158],"underlying":[36],"modes":[37],"of":[38,50,69,86,112,144,161],"distribution":[40,143],"with":[41],"these":[42],"is":[44],"computationally":[45],"expensive,":[46],"requiring":[47],"large":[48],"numbers":[49],"samples":[51],"and":[52],"post-hoc":[53],"clustering.":[54],"In":[55],"paper,":[57],"we":[58,98,131,153,166],"shift":[59],"focus":[61],"from":[62],"stochastic":[63],"sampling":[64],"direct":[67],"generation":[68],"likely":[70],"outcomes.":[71],"We":[72],"introduce":[73],"mode":[74,171],"proposal":[75,87],"models,":[76],"a":[77,83,90,100,162],"deterministic":[78],"framework":[79],"efficiently":[81,168],"produces":[82],"fixed-size":[84],"set":[85],"masks":[88],"in":[89,105],"single":[91],"forward":[92],"pass.":[93],"To":[94],"handle":[95],"superfluous":[96],"proposals,":[97],"adapt":[99],"confidence":[101],"mechanism,":[102],"traditionally":[103],"used":[104],"object":[106],"detection,":[107],"high-dimensional":[110],"space":[111],"masks.":[114],"Our":[115],"approach":[116],"significantly":[117],"reduces":[118],"inference":[119],"time":[120],"while":[121],"achieving":[122],"higher":[123],"ground-truth":[124],"coverage":[125],"than":[126],"existing":[127],"models.":[129],"Furthermore,":[130],"demonstrate":[132],"our":[134,174],"model":[135],"can":[136,167],"be":[137],"trained":[138],"without":[139],"knowing":[140],"full":[142],"outcomes,":[145],"making":[146],"it":[147],"applicable":[148],"real-world":[150],"datasets.":[151],"Finally,":[152],"show":[154],"by":[156],"decomposing":[157],"velocity":[159],"field":[160],"pre-trained":[163],"flow":[164],"model,":[165],"estimate":[169],"prior":[170],"probabilities":[172],"for":[173],"proposals.":[175]},"counts_by_year":[],"updated_date":"2026-07-01T06:00:48.157686","created_date":"2026-03-24T00:00:00"}
