{"id":"https://openalex.org/W7135038243","doi":"https://doi.org/10.48550/arxiv.2603.10828","title":"BALD-SAM: Disagreement-based Active Prompting in Interactive Segmentation","display_name":"BALD-SAM: Disagreement-based Active Prompting in Interactive Segmentation","publication_year":2026,"publication_date":"2026-03-11","ids":{"openalex":"https://openalex.org/W7135038243","doi":"https://doi.org/10.48550/arxiv.2603.10828"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.10828","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.10828","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.10828","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5038203465","display_name":"Prithwijit Chowdhury","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chowdhury, Prithwijit","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5010958338","display_name":"Mohit Prabhushankar","orcid":"https://orcid.org/0000-0002-8743-7058"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Prabhushankar, Mohit","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5128865910","display_name":"Ghassan AlRegib","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"AlRegib, Ghassan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.8622999787330627,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.8622999787330627,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.03669999912381172,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.014600000344216824,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/annotation","display_name":"Annotation","score":0.5720000267028809},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.5555999875068665},{"id":"https://openalex.org/keywords/bayesian-probability","display_name":"Bayesian probability","score":0.5296000242233276},{"id":"https://openalex.org/keywords/active-learning","display_name":"Active learning (machine learning)","score":0.503000020980835},{"id":"https://openalex.org/keywords/workflow","display_name":"Workflow","score":0.5009999871253967},{"id":"https://openalex.org/keywords/oracle","display_name":"Oracle","score":0.4876999855041504},{"id":"https://openalex.org/keywords/suite","display_name":"Suite","score":0.4742000102996826},{"id":"https://openalex.org/keywords/ranking","display_name":"Ranking (information retrieval)","score":0.44670000672340393},{"id":"https://openalex.org/keywords/bayesian-inference","display_name":"Bayesian inference","score":0.4352000057697296}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7754999995231628},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6427000164985657},{"id":"https://openalex.org/C2776321320","wikidata":"https://www.wikidata.org/wiki/Q857525","display_name":"Annotation","level":2,"score":0.5720000267028809},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.5555999875068665},{"id":"https://openalex.org/C107673813","wikidata":"https://www.wikidata.org/wiki/Q812534","display_name":"Bayesian probability","level":2,"score":0.5296000242233276},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5163000226020813},{"id":"https://openalex.org/C77967617","wikidata":"https://www.wikidata.org/wiki/Q4677561","display_name":"Active learning (machine learning)","level":2,"score":0.503000020980835},{"id":"https://openalex.org/C177212765","wikidata":"https://www.wikidata.org/wiki/Q627335","display_name":"Workflow","level":2,"score":0.5009999871253967},{"id":"https://openalex.org/C55166926","wikidata":"https://www.wikidata.org/wiki/Q2892946","display_name":"Oracle","level":2,"score":0.4876999855041504},{"id":"https://openalex.org/C79581498","wikidata":"https://www.wikidata.org/wiki/Q1367530","display_name":"Suite","level":2,"score":0.4742000102996826},{"id":"https://openalex.org/C189430467","wikidata":"https://www.wikidata.org/wiki/Q7293293","display_name":"Ranking (information retrieval)","level":2,"score":0.44670000672340393},{"id":"https://openalex.org/C160234255","wikidata":"https://www.wikidata.org/wiki/Q812535","display_name":"Bayesian inference","level":3,"score":0.4352000057697296},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.39590001106262207},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.38760000467300415},{"id":"https://openalex.org/C81917197","wikidata":"https://www.wikidata.org/wiki/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.3725000023841858},{"id":"https://openalex.org/C184898388","wikidata":"https://www.wikidata.org/wiki/Q1435712","display_name":"Pairwise comparison","level":2,"score":0.37059998512268066},{"id":"https://openalex.org/C93959086","wikidata":"https://www.wikidata.org/wiki/Q6888345","display_name":"Model selection","level":2,"score":0.3093999922275543},{"id":"https://openalex.org/C177769412","wikidata":"https://www.wikidata.org/wiki/Q278090","display_name":"Prior probability","level":3,"score":0.3075000047683716},{"id":"https://openalex.org/C207201462","wikidata":"https://www.wikidata.org/wiki/Q182505","display_name":"Bayes' theorem","level":3,"score":0.2948000133037567},{"id":"https://openalex.org/C159620131","wikidata":"https://www.wikidata.org/wiki/Q1938983","display_name":"Spatial analysis","level":2,"score":0.28209999203681946},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.2709999978542328},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.26249998807907104},{"id":"https://openalex.org/C160920958","wikidata":"https://www.wikidata.org/wiki/Q7662746","display_name":"Synthetic data","level":2,"score":0.26030001044273376},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.25920000672340393},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.2540000081062317},{"id":"https://openalex.org/C125308379","wikidata":"https://www.wikidata.org/wiki/Q363057","display_name":"Market segmentation","level":2,"score":0.25369998812675476}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.10828","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.10828","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.10828","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.10828","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"The":[0],"Segment":[1],"Anything":[2],"Model":[3],"(SAM)":[4],"has":[5],"revolutionized":[6],"interactive":[7,63],"segmentation":[8,239],"through":[9,197],"spatial":[10,89,131],"prompting.":[11],"While":[12],"existing":[13],"work":[14],"primarily":[15],"focuses":[16],"on":[17,45,188,242],"automating":[18],"prompts":[19,37,102],"in":[20,226,237],"various":[21],"settings,":[22],"real-world":[23],"annotation":[24],"workflows":[25],"involve":[26],"iterative":[27],"refinement":[28],"where":[29,93],"annotators":[30],"observe":[31],"model":[32,145],"outputs":[33],"and":[34,101,146,176,206,244],"strategically":[35],"place":[36],"to":[38,66,71,106,130,152,212],"resolve":[39],"ambiguities.":[40],"Current":[41],"pipelines":[42],"typically":[43],"rely":[44],"the":[46,51,73,78,111,143],"annotator's":[47],"visual":[48],"assessment":[49],"of":[50,113,190],"predicted":[52],"mask":[53],"quality.":[54],"We":[55,116,193],"postulate":[56],"that":[57],"a":[58,68,88,120,153,198],"principled":[59,121],"approach":[60,92],"for":[61,77,163],"automated":[62],"prompting":[64,224],"is":[65],"use":[67],"model-derived":[69],"criterion":[70],"identify":[72],"most":[74],"informative":[75],"region":[76],"next":[79],"prompt.":[80],"In":[81],"this":[82],"work,":[83],"we":[84,141],"establish":[85],"active":[86,90],"prompting:":[87],"learning":[91],"locations":[94],"within":[95],"images":[96],"constitute":[97],"an":[98],"unlabeled":[99],"pool":[100],"serve":[103],"as":[104],"queries":[105],"prioritize":[107],"information-rich":[108],"regions,":[109],"increasing":[110],"utility":[112],"each":[114],"interaction.":[115],"further":[117],"present":[118],"BALD-SAM:":[119],"framework":[122],"adapting":[123],"Bayesian":[124,148],"Active":[125],"Learning":[126],"by":[127,134],"Disagreement":[128],"(BALD)":[129],"prompt":[132],"selection":[133],"quantifying":[135],"epistemic":[136],"uncertainty.":[137],"To":[138],"do":[139],"so,":[140],"freeze":[142],"entire":[144],"apply":[147],"uncertainty":[149,160],"modeling":[150],"only":[151],"small":[154],"learned":[155],"prediction":[156],"head,":[157],"making":[158],"intractable":[159],"estimation":[161],"practical":[162],"large":[164],"multi-million":[165],"parameter":[166],"foundation":[167],"models.":[168],"Across":[169],"16":[170,191],"datasets":[171],"spanning":[172],"natural,":[173],"medical,":[174],"underwater,":[175],"seismic":[177],"domains,":[178],"BALD-SAM":[179,221],"demonstrates":[180],"strong":[181,218],"cross-domain":[182],"performance,":[183,220],"ranking":[184],"first":[185],"or":[186],"second":[187],"14":[189],"benchmarks.":[192],"validate":[194],"these":[195],"gains":[196],"comprehensive":[199],"ablation":[200,215],"suite":[201],"covering":[202],"3":[203],"SAM":[204],"backbones":[205],"35":[207],"Laplace":[208],"posterior":[209],"configurations,":[210],"amounting":[211],"38":[213],"distinct":[214],"settings.":[216],"Beyond":[217],"average":[219],"surpasses":[222],"human":[223],"and,":[225],"several":[227],"categories,":[228],"even":[229],"oracle":[230],"prompting,":[231],"while":[232],"consistently":[233],"outperforming":[234],"one-shot":[235],"baselines":[236],"final":[238],"quality,":[240],"particularly":[241],"thin":[243],"structurally":[245],"complex":[246],"objects.":[247]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-03-13T00:00:00"}
