{"id":"https://openalex.org/W7124948151","doi":"https://doi.org/10.1109/cbmi66578.2025.11339342","title":"MMMS: Multi-Modal Multi-Surface Interactive Segmentation","display_name":"MMMS: Multi-Modal Multi-Surface Interactive Segmentation","publication_year":2025,"publication_date":"2025-10-22","ids":{"openalex":"https://openalex.org/W7124948151","doi":"https://doi.org/10.1109/cbmi66578.2025.11339342"},"language":null,"primary_location":{"id":"doi:10.1109/cbmi66578.2025.11339342","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cbmi66578.2025.11339342","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 International Conference on Content-Based Multimedia Indexing (CBMI)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5089961361","display_name":"Robin Sch\u00f6n","orcid":null},"institutions":[{"id":"https://openalex.org/I142270456","display_name":"Technische Hochschule Augsburg","ror":"https://ror.org/016604a03","country_code":"DE","type":"education","lineage":["https://openalex.org/I142270456"]},{"id":"https://openalex.org/I179225836","display_name":"University of Augsburg","ror":"https://ror.org/03p14d497","country_code":"DE","type":"education","lineage":["https://openalex.org/I179225836"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"Robin Sch\u00f6n","raw_affiliation_strings":["Fakult&#x00E4;t f&#x00FC;r Angewandte Informatik, University of Augsburg,Augsburg,Germany"],"affiliations":[{"raw_affiliation_string":"Fakult&#x00E4;t f&#x00FC;r Angewandte Informatik, University of Augsburg,Augsburg,Germany","institution_ids":["https://openalex.org/I179225836","https://openalex.org/I142270456"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5069783164","display_name":"Julian Lorenz","orcid":"https://orcid.org/0000-0002-8893-4355"},"institutions":[{"id":"https://openalex.org/I179225836","display_name":"University of Augsburg","ror":"https://ror.org/03p14d497","country_code":"DE","type":"education","lineage":["https://openalex.org/I179225836"]},{"id":"https://openalex.org/I142270456","display_name":"Technische Hochschule Augsburg","ror":"https://ror.org/016604a03","country_code":"DE","type":"education","lineage":["https://openalex.org/I142270456"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Julian Lorenz","raw_affiliation_strings":["Fakult&#x00E4;t f&#x00FC;r Angewandte Informatik, University of Augsburg,Augsburg,Germany"],"affiliations":[{"raw_affiliation_string":"Fakult&#x00E4;t f&#x00FC;r Angewandte Informatik, University of Augsburg,Augsburg,Germany","institution_ids":["https://openalex.org/I179225836","https://openalex.org/I142270456"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5012808536","display_name":"Katja Ludwig","orcid":"https://orcid.org/0000-0002-5721-243X"},"institutions":[{"id":"https://openalex.org/I179225836","display_name":"University of Augsburg","ror":"https://ror.org/03p14d497","country_code":"DE","type":"education","lineage":["https://openalex.org/I179225836"]},{"id":"https://openalex.org/I142270456","display_name":"Technische Hochschule Augsburg","ror":"https://ror.org/016604a03","country_code":"DE","type":"education","lineage":["https://openalex.org/I142270456"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Katja Ludwig","raw_affiliation_strings":["Fakult&#x00E4;t f&#x00FC;r Angewandte Informatik, University of Augsburg,Augsburg,Germany"],"affiliations":[{"raw_affiliation_string":"Fakult&#x00E4;t f&#x00FC;r Angewandte Informatik, University of Augsburg,Augsburg,Germany","institution_ids":["https://openalex.org/I179225836","https://openalex.org/I142270456"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123381046","display_name":"Daniel Kienle","orcid":null},"institutions":[{"id":"https://openalex.org/I179225836","display_name":"University of Augsburg","ror":"https://ror.org/03p14d497","country_code":"DE","type":"education","lineage":["https://openalex.org/I179225836"]},{"id":"https://openalex.org/I142270456","display_name":"Technische Hochschule Augsburg","ror":"https://ror.org/016604a03","country_code":"DE","type":"education","lineage":["https://openalex.org/I142270456"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Daniel Kienle","raw_affiliation_strings":["Fakult&#x00E4;t f&#x00FC;r Angewandte Informatik, University of Augsburg,Augsburg,Germany"],"affiliations":[{"raw_affiliation_string":"Fakult&#x00E4;t f&#x00FC;r Angewandte Informatik, University of Augsburg,Augsburg,Germany","institution_ids":["https://openalex.org/I179225836","https://openalex.org/I142270456"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5009744749","display_name":"Rainer Lienhart","orcid":"https://orcid.org/0000-0003-4007-6889"},"institutions":[{"id":"https://openalex.org/I142270456","display_name":"Technische Hochschule Augsburg","ror":"https://ror.org/016604a03","country_code":"DE","type":"education","lineage":["https://openalex.org/I142270456"]},{"id":"https://openalex.org/I179225836","display_name":"University of Augsburg","ror":"https://ror.org/03p14d497","country_code":"DE","type":"education","lineage":["https://openalex.org/I179225836"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Rainer Lienhart","raw_affiliation_strings":["Fakult&#x00E4;t f&#x00FC;r Angewandte Informatik, University of Augsburg,Augsburg,Germany"],"affiliations":[{"raw_affiliation_string":"Fakult&#x00E4;t f&#x00FC;r Angewandte Informatik, University of Augsburg,Augsburg,Germany","institution_ids":["https://openalex.org/I179225836","https://openalex.org/I142270456"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5089961361"],"corresponding_institution_ids":["https://openalex.org/I142270456","https://openalex.org/I179225836"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.7010347,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"8"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.23170000314712524,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.23170000314712524,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10719","display_name":"3D Shape Modeling and Analysis","score":0.14669999480247498,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11605","display_name":"Visual Attention and Saliency Detection","score":0.10679999738931656,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.8385999798774719},{"id":"https://openalex.org/keywords/scale-space-segmentation","display_name":"Scale-space segmentation","score":0.6388999819755554},{"id":"https://openalex.org/keywords/segmentation-based-object-categorization","display_name":"Segmentation-based object categorization","score":0.5788000226020813},{"id":"https://openalex.org/keywords/metric","display_name":"Metric (unit)","score":0.5577999949455261},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.4887000024318695},{"id":"https://openalex.org/keywords/rgb-color-model","display_name":"RGB color model","score":0.4830999970436096},{"id":"https://openalex.org/keywords/image-segmentation","display_name":"Image segmentation","score":0.4580000042915344},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.4113999903202057}],"concepts":[{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.8385999798774719},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.763700008392334},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6904000043869019},{"id":"https://openalex.org/C65885262","wikidata":"https://www.wikidata.org/wiki/Q7429708","display_name":"Scale-space segmentation","level":4,"score":0.6388999819755554},{"id":"https://openalex.org/C25694479","wikidata":"https://www.wikidata.org/wiki/Q7446278","display_name":"Segmentation-based object categorization","level":5,"score":0.5788000226020813},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.573199987411499},{"id":"https://openalex.org/C176217482","wikidata":"https://www.wikidata.org/wiki/Q860554","display_name":"Metric (unit)","level":2,"score":0.5577999949455261},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.4887000024318695},{"id":"https://openalex.org/C82990744","wikidata":"https://www.wikidata.org/wiki/Q166194","display_name":"RGB color model","level":2,"score":0.4830999970436096},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.4580000042915344},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.4113999903202057},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.4083000123500824},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3952000141143799},{"id":"https://openalex.org/C123657996","wikidata":"https://www.wikidata.org/wiki/Q12271","display_name":"Architecture","level":2,"score":0.3174000084400177},{"id":"https://openalex.org/C193415008","wikidata":"https://www.wikidata.org/wiki/Q639681","display_name":"Network architecture","level":2,"score":0.3125},{"id":"https://openalex.org/C12725497","wikidata":"https://www.wikidata.org/wiki/Q810247","display_name":"Baseline (sea)","level":2,"score":0.3043999969959259},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.2957000136375427},{"id":"https://openalex.org/C42314347","wikidata":"https://www.wikidata.org/wiki/Q6865488","display_name":"Minimum spanning tree-based segmentation","level":5,"score":0.28040000796318054},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.26089999079704285}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/cbmi66578.2025.11339342","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cbmi66578.2025.11339342","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 International Conference on Content-Based Multimedia Indexing (CBMI)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":35,"referenced_works":["https://openalex.org/W1861492603","https://openalex.org/W2116719896","https://openalex.org/W2121927366","https://openalex.org/W2124351162","https://openalex.org/W2144794286","https://openalex.org/W2470139095","https://openalex.org/W2587989515","https://openalex.org/W2774839435","https://openalex.org/W2921749009","https://openalex.org/W2948672349","https://openalex.org/W2964037732","https://openalex.org/W3034278117","https://openalex.org/W3034586976","https://openalex.org/W3132926949","https://openalex.org/W4312326868","https://openalex.org/W4312336332","https://openalex.org/W4313142416","https://openalex.org/W4313156423","https://openalex.org/W4317905987","https://openalex.org/W4385801616","https://openalex.org/W4386065698","https://openalex.org/W4386071535","https://openalex.org/W4386076428","https://openalex.org/W4386179772","https://openalex.org/W4390872677","https://openalex.org/W4390872789","https://openalex.org/W4390873051","https://openalex.org/W4390873110","https://openalex.org/W4390874575","https://openalex.org/W4391769355","https://openalex.org/W4402716258","https://openalex.org/W4403421044","https://openalex.org/W4406983313","https://openalex.org/W4409917716","https://openalex.org/W4415539405"],"related_works":[],"abstract_inverted_index":{"In":[0],"this":[1,59,80,106],"paper,":[2],"we":[3,45,142,213],"present":[4,31,47],"a":[5,48,83,93,134,234],"method":[6,64,81],"to":[7,22,67,71,123,146,162,175,194,205,216],"interactively":[8],"create":[9],"segmentation":[10,24,74,113,170,238],"masks":[11],"on":[12,105,199,201,207],"the":[13,23,33,56,62,73,77,108,139,148,152,157,163,177,190],"basis":[14],"of":[15,25,58,79,95,179,211],"user":[16],"clicks.":[17,103],"We":[18,115,160,172],"pay":[19],"particular":[20],"attention":[21],"multiple":[26],"surfaces":[27,38],"that":[28,53,120,218],"are":[29,173,214],"simultaneously":[30],"in":[32,225,233],"same":[34],"image.":[35],"Since":[36],"these":[37],"may":[39],"be":[40],"heavily":[41],"entangled":[42],"and":[43,101,156,203,224],"adjacent,":[44],"also":[46],"novel":[49],"extended":[50],"evaluation":[51],"metric":[52],"accounts":[54],"for":[55],"challenges":[57],"scenario.":[60,239],"Additionally,":[61],"presented":[63],"is":[65,82,130],"able":[66,174,215],"use":[68],"multi-modal":[69,158,167,181],"inputs":[70],"facilitate":[72],"task.":[75],"At":[76],"center":[78],"network":[84,109],"architecture":[85,118],"which":[86],"takes":[87],"as":[88,133,166],"input":[89],"an":[90,98,111],"RGB":[91,128],"image,":[92],"number":[94],"non-RGB":[96],"modalities,":[97,186],"erroneous":[99],"mask,":[100],"encoded":[102],"Based":[104],"input,":[107],"predicts":[110],"improved":[112],"mask.":[114],"design":[116],"our":[117,144,180,187,219],"such":[119],"it":[121],"adheres":[122],"two":[124],"conditions:":[125],"(1)":[126],"The":[127],"backbone":[129],"only":[131],"available":[132],"black-box.":[135],"(2)":[136],"To":[137],"reduce":[138],"response":[140],"time,":[141],"want":[143],"model":[145],"integrate":[147],"interaction-specific":[149],"information":[150],"after":[151],"image":[153],"feature":[154],"extraction":[155],"fusion.":[159],"refer":[161],"overall":[164],"task":[165],"multi-surface":[168],"interactive":[169,237],"(MMMS).":[171],"show":[176,217],"effectiveness":[178],"fusion":[182],"strategy.":[183],"Using":[184],"additional":[185],"system":[188],"reduces":[189],"NoC@90":[191],"by":[192],"up":[193,204],"1.28":[195],"clicks":[196],"per":[197],"surface":[198],"average":[200],"DeLiVER":[202],"1.19":[206],"MFNet.":[208],"On":[209],"top":[210],"this,":[212],"RGB-only":[220],"baseline":[221],"achieves":[222],"competitive,":[223],"some":[226],"cases":[227],"even":[228],"superior":[229],"performance":[230],"when":[231],"tested":[232],"classical,":[235],"single-mask":[236]},"counts_by_year":[],"updated_date":"2026-01-22T23:29:09.771500","created_date":"2026-01-21T00:00:00"}
