{"id":"https://openalex.org/W4416965981","doi":"https://doi.org/10.1109/tmm.2025.3639952","title":"Investigate Interactive Semantic Segmentation via an Uncertainty Mining View","display_name":"Investigate Interactive Semantic Segmentation via an Uncertainty Mining View","publication_year":2025,"publication_date":"2025-12-03","ids":{"openalex":"https://openalex.org/W4416965981","doi":"https://doi.org/10.1109/tmm.2025.3639952"},"language":null,"primary_location":{"id":"doi:10.1109/tmm.2025.3639952","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2025.3639952","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5019412701","display_name":"Yutong Gao","orcid":"https://orcid.org/0000-0002-6766-0703"},"institutions":[{"id":"https://openalex.org/I145897649","display_name":"Minzu University of China","ror":"https://ror.org/0044e2g62","country_code":"CN","type":"education","lineage":["https://openalex.org/I145897649"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yutong Gao","raw_affiliation_strings":["Ministry of Education Key Laboratory of Ethnic Language Intelligent Analysis and Security Governance, School of Information Engineering, Minzu University of China, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-6766-0703","affiliations":[{"raw_affiliation_string":"Ministry of Education Key Laboratory of Ethnic Language Intelligent Analysis and Security Governance, School of Information Engineering, Minzu University of China, Beijing, China","institution_ids":["https://openalex.org/I145897649"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5023442981","display_name":"Congyan Lang","orcid":"https://orcid.org/0000-0001-6059-7943"},"institutions":[{"id":"https://openalex.org/I21193070","display_name":"Beijing Jiaotong University","ror":"https://ror.org/01yj56c84","country_code":"CN","type":"education","lineage":["https://openalex.org/I21193070"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Congyan Lang","raw_affiliation_strings":["Beijing Key Laboratory of Traffic Data Analysis and Mining, School of Computer and Information Technology, Beijing Jiaotong University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0001-6059-7943","affiliations":[{"raw_affiliation_string":"Beijing Key Laboratory of Traffic Data Analysis and Mining, School of Computer and Information Technology, Beijing Jiaotong University, Beijing, China","institution_ids":["https://openalex.org/I21193070"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5042271198","display_name":"Fayao Liu","orcid":"https://orcid.org/0000-0001-6649-7660"},"institutions":[{"id":"https://openalex.org/I115228651","display_name":"Agency for Science, Technology and Research","ror":"https://ror.org/036wvzt09","country_code":"SG","type":"government","lineage":["https://openalex.org/I115228651"]},{"id":"https://openalex.org/I3005327000","display_name":"Institute for Infocomm Research","ror":"https://ror.org/053rfa017","country_code":"SG","type":"facility","lineage":["https://openalex.org/I115228651","https://openalex.org/I3005327000","https://openalex.org/I91275662"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Fayao Liu","raw_affiliation_strings":["Institute for Infocomm Research, A*STAR, Singapore"],"raw_orcid":"https://orcid.org/0000-0001-6649-7660","affiliations":[{"raw_affiliation_string":"Institute for Infocomm Research, A*STAR, Singapore","institution_ids":["https://openalex.org/I3005327000","https://openalex.org/I115228651"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100451925","display_name":"Xun Xu","orcid":"https://orcid.org/0000-0002-5220-2240"},"institutions":[{"id":"https://openalex.org/I115228651","display_name":"Agency for Science, Technology and Research","ror":"https://ror.org/036wvzt09","country_code":"SG","type":"government","lineage":["https://openalex.org/I115228651"]},{"id":"https://openalex.org/I3005327000","display_name":"Institute for Infocomm Research","ror":"https://ror.org/053rfa017","country_code":"SG","type":"facility","lineage":["https://openalex.org/I115228651","https://openalex.org/I3005327000","https://openalex.org/I91275662"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Xun Xu","raw_affiliation_strings":["Institute for Infocomm Research, A*STAR, Singapore"],"raw_orcid":"https://orcid.org/0000-0002-5220-2240","affiliations":[{"raw_affiliation_string":"Institute for Infocomm Research, A*STAR, Singapore","institution_ids":["https://openalex.org/I3005327000","https://openalex.org/I115228651"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5019990791","display_name":"Yuanzhouhan Cao","orcid":"https://orcid.org/0000-0002-2064-8336"},"institutions":[{"id":"https://openalex.org/I21193070","display_name":"Beijing Jiaotong University","ror":"https://ror.org/01yj56c84","country_code":"CN","type":"education","lineage":["https://openalex.org/I21193070"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuanzhouhan Cao","raw_affiliation_strings":["School of Computer Science and Information Technology, Beijing Jiaotong University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-2064-8336","affiliations":[{"raw_affiliation_string":"School of Computer Science and Information Technology, Beijing Jiaotong University, Beijing, China","institution_ids":["https://openalex.org/I21193070"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101250534","display_name":"Lijuan Sun","orcid":null},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lijuan Sun","raw_affiliation_strings":["School of Economics and Management, Key Laboratory of Trustworthy Distributed Computing and Service, Ministry of Education, Beijing University of Posts and Telecommunications, Beijing, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Economics and Management, Key Laboratory of Trustworthy Distributed Computing and Service, Ministry of Education, Beijing University of Posts and Telecommunications, Beijing, China","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5087043856","display_name":"Yunchao Wei","orcid":"https://orcid.org/0000-0002-2812-8781"},"institutions":[{"id":"https://openalex.org/I21193070","display_name":"Beijing Jiaotong University","ror":"https://ror.org/01yj56c84","country_code":"CN","type":"education","lineage":["https://openalex.org/I21193070"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yunchao Wei","raw_affiliation_strings":["Institute of Information Science, Beijing Jiaotong University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-2812-8781","affiliations":[{"raw_affiliation_string":"Institute of Information Science, Beijing Jiaotong University, Beijing, China","institution_ids":["https://openalex.org/I21193070"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5019412701"],"corresponding_institution_ids":["https://openalex.org/I145897649"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.37415929,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"28","issue":null,"first_page":"1613","last_page":"1625"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.4659999907016754,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.4659999907016754,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.07760000228881836,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10799","display_name":"Data Visualization and Analytics","score":0.03819999843835831,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.7092000246047974},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.5533999800682068},{"id":"https://openalex.org/keywords/encoding","display_name":"Encoding (memory)","score":0.5012000203132629},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.48339998722076416},{"id":"https://openalex.org/keywords/scheme","display_name":"Scheme (mathematics)","score":0.4462999999523163},{"id":"https://openalex.org/keywords/semantic-computing","display_name":"Semantic computing","score":0.37299999594688416},{"id":"https://openalex.org/keywords/confusion","display_name":"Confusion","score":0.3483000099658966}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.9086999893188477},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.7092000246047974},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.5533999800682068},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5271999835968018},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.5012000203132629},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.48339998722076416},{"id":"https://openalex.org/C77618280","wikidata":"https://www.wikidata.org/wiki/Q1155772","display_name":"Scheme (mathematics)","level":2,"score":0.4462999999523163},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4032000005245209},{"id":"https://openalex.org/C511149849","wikidata":"https://www.wikidata.org/wiki/Q7449051","display_name":"Semantic computing","level":3,"score":0.37299999594688416},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.357699990272522},{"id":"https://openalex.org/C2781140086","wikidata":"https://www.wikidata.org/wiki/Q557945","display_name":"Confusion","level":2,"score":0.3483000099658966},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.34779998660087585},{"id":"https://openalex.org/C188198153","wikidata":"https://www.wikidata.org/wiki/Q1613840","display_name":"Limiting","level":2,"score":0.33340001106262207},{"id":"https://openalex.org/C130318100","wikidata":"https://www.wikidata.org/wiki/Q2268914","display_name":"Semantic similarity","level":2,"score":0.32510000467300415},{"id":"https://openalex.org/C193125573","wikidata":"https://www.wikidata.org/wiki/Q7449065","display_name":"Semantic interpretation","level":2,"score":0.3188999891281128},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.3181000053882599},{"id":"https://openalex.org/C155512373","wikidata":"https://www.wikidata.org/wiki/Q287450","display_name":"Residual","level":2,"score":0.30079999566078186},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.2924000024795532},{"id":"https://openalex.org/C67712803","wikidata":"https://www.wikidata.org/wiki/Q7901853","display_name":"User modeling","level":3,"score":0.2662999927997589},{"id":"https://openalex.org/C2777946921","wikidata":"https://www.wikidata.org/wiki/Q7449044","display_name":"Semantic analysis (machine learning)","level":2,"score":0.2556000053882599}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tmm.2025.3639952","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2025.3639952","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G4786667784","display_name":null,"funder_award_id":"L221011","funder_id":"https://openalex.org/F4320322919","funder_display_name":"Natural Science Foundation of Beijing Municipality"},{"id":"https://openalex.org/G6960108870","display_name":null,"funder_award_id":"A20H6b0151","funder_id":"https://openalex.org/F4320320696","funder_display_name":"Agency for Science, Technology and Research"},{"id":"https://openalex.org/G8099282535","display_name":null,"funder_award_id":"BATLAB202403","funder_id":"https://openalex.org/F4320312071","funder_display_name":"Ministry of Education, Libya"}],"funders":[{"id":"https://openalex.org/F4320312071","display_name":"Ministry of Education, Libya","ror":"https://ror.org/02w030k33"},{"id":"https://openalex.org/F4320320696","display_name":"Agency for Science, Technology and Research","ror":"https://ror.org/036wvzt09"},{"id":"https://openalex.org/F4320322919","display_name":"Natural Science Foundation of Beijing Municipality","ror":null},{"id":"https://openalex.org/F4320323066","display_name":"Beijing Jiaotong University","ror":"https://ror.org/01yj56c84"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":52,"referenced_works":["https://openalex.org/W1967268147","https://openalex.org/W2083277843","https://openalex.org/W2104095591","https://openalex.org/W2121947440","https://openalex.org/W2124351162","https://openalex.org/W2169551590","https://openalex.org/W2294819727","https://openalex.org/W2300469113","https://openalex.org/W2763160469","https://openalex.org/W2769833683","https://openalex.org/W2770462575","https://openalex.org/W2776163999","https://openalex.org/W2787091153","https://openalex.org/W2789103781","https://openalex.org/W2795276939","https://openalex.org/W2798769484","https://openalex.org/W2895800749","https://openalex.org/W2948553897","https://openalex.org/W2956371155","https://openalex.org/W2963072537","https://openalex.org/W2964037732","https://openalex.org/W2964221652","https://openalex.org/W2964252655","https://openalex.org/W2965289249","https://openalex.org/W2967279867","https://openalex.org/W3011572863","https://openalex.org/W3034278117","https://openalex.org/W3034550159","https://openalex.org/W3034586976","https://openalex.org/W3087845270","https://openalex.org/W3093450153","https://openalex.org/W3093644825","https://openalex.org/W3096945436","https://openalex.org/W3132926949","https://openalex.org/W3138986594","https://openalex.org/W3148848505","https://openalex.org/W3204877997","https://openalex.org/W3211091494","https://openalex.org/W3213143587","https://openalex.org/W4214588164","https://openalex.org/W4214893857","https://openalex.org/W4220834633","https://openalex.org/W4285222939","https://openalex.org/W4289387907","https://openalex.org/W4312336332","https://openalex.org/W4312603257","https://openalex.org/W4386075720","https://openalex.org/W4386075998","https://openalex.org/W4386076245","https://openalex.org/W4390872677","https://openalex.org/W4390872789","https://openalex.org/W4390874575"],"related_works":[],"abstract_inverted_index":{"With":[0],"the":[1,48,117,133,137,141,150,154,160,164,179,210,213,240,244,252,259,270,276],"rapid":[2],"development":[3,76],"of":[4,120,212,261,272],"intelligence":[5],"media,":[6],"traditional":[7,25],"semantic":[8,43,60,219,231,249,286],"segmentation":[9,26,39,44,61,287],"has":[10,73],"shown":[11],"excellent":[12],"potential":[13],"in":[14,34,78,153],"application":[15,80],"scenarios":[16],"like":[17],"autonomous":[18],"driving.":[19],"However,":[20],"due":[21,53],"to":[22,30,54,57,104,136,171,221,237],"limited":[23],"performance,":[24],"models":[27],"usually":[28],"lead":[29,170],"poor":[31],"user":[32,122,127,165],"experiences":[33],"applications":[35],"that":[36],"require":[37],"high":[38],"precision.":[40],"Therefore,":[41],"interactive":[42,100],"(ISS)":[45],"is":[46,50],"gaining":[47,51],"attention":[49,52],"its":[55,218],"capability":[56],"generate":[58],"high-precision":[59],"results":[62],"through":[63,264],"a":[64,74,187,223,230],"few":[65],"user-provided":[66],"clicks":[67,123],"for":[68,140,275],"experience":[69],"improvement,":[70],"which":[71,158],"thus":[72],"promising":[75],"prospect":[77],"fine-grained":[79],"scenarios,":[81],"<italic":[82,91,129],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[83,92,130],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">e.g.</i>,":[84],"virtual":[85],"reality,":[86],"smart":[87],"medical,":[88],"data":[89],"annotation,":[90],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">etc.</i>.":[93],"For":[94],"good":[95],"interaction":[96,156,161,180],"efficiency,":[97],"most":[98],"existing":[99],"methods":[101],"make":[102],"efforts":[103],"conduct":[105],"suitable":[106],"click":[107,112,173,176,202,214,225,253],"simulation":[108,174,205,215],"strategies":[109],"and":[110,124,163,175,217,254,267],"reasonable":[111,188,224],"encoding":[113,234],"methods,":[114],"aiming":[115],"at":[116],"robust":[118],"understanding":[119],"diverse":[121],"translating":[125],"comprehensible":[126],"intent,":[128],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">i.e.</i>,":[131],"assign":[132],"correct":[134],"category":[135],"clicked":[138],"area,":[139],"neural":[142],"network.":[143],"Though":[144],"proved":[145],"effective,":[146],"their":[147],"designs":[148],"ignore":[149],"uncertainty":[151,193,211,232,273],"hiding":[152],"extracted":[155],"features,":[157],"reflects":[159],"difficulty":[162],"clicking":[166],"intents.":[167],"This":[168],"can":[169,280],"inappropriate":[172],"encoding,":[177],"limiting":[178],"efficiency.":[181],"Hence":[182],"we":[183,197,228],"focus":[184],"on":[185,284],"exploring":[186],"ISS":[189],"scheme":[190],"via":[191],"an":[192,199],"mining":[194,248,274],"view.":[195],"Specifically,":[196],"propose":[198,229],"uncertainty-based":[200],"class-balanced":[201],"sampling":[203],"(UCCS)":[204],"strategy":[206],"by":[207,247],"considering":[208],"both":[209],"region":[216],"imbalance,":[220],"form":[222],"distribution.":[226],"Furthermore,":[227],"residual":[233],"(SURE)":[235],"method":[236],"better":[238],"embed":[239],"user's":[241],"intention":[242],"into":[243],"localization":[245],"maps,":[246],"confusion":[250],"between":[251],"misprediction":[255],"classes.":[256],"We":[257],"prove":[258],"effectiveness":[260],"our":[262],"design":[263],"extensive":[265],"experiments":[266],"initially":[268],"analyze":[269],"importance":[271],"ISS.":[277],"Our":[278],"model":[279],"achieve":[281],"state-of-the-art":[282],"performance":[283],"three":[285],"benchmarks.":[288]},"counts_by_year":[],"updated_date":"2026-03-09T07:00:12.390032","created_date":"2025-12-03T00:00:00"}
