{"id":"https://openalex.org/W7086945554","doi":"https://doi.org/10.1109/tmm.2025.3618549","title":"ICTNet: Image Complexity-Aware Two-Branch Network With Enhanced Decoding for Real-Time Segmentation","display_name":"ICTNet: Image Complexity-Aware Two-Branch Network With Enhanced Decoding for Real-Time Segmentation","publication_year":2025,"publication_date":"2025-01-01","ids":{"openalex":"https://openalex.org/W7086945554","doi":"https://doi.org/10.1109/tmm.2025.3618549"},"language":"en","primary_location":{"id":"doi:10.1109/tmm.2025.3618549","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2025.3618549","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Xin Zhang","orcid":"https://orcid.org/0000-0002-4941-201X"},"institutions":[{"id":"https://openalex.org/I205237279","display_name":"Nankai University","ror":"https://ror.org/01y1kjr75","country_code":"CN","type":"education","lineage":["https://openalex.org/I205237279"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Xin Zhang","raw_affiliation_strings":["VCIP &amp; TMCC &amp; DISSec, College of Computer Science, Nankai University, Tianjin, China"],"affiliations":[{"raw_affiliation_string":"VCIP &amp; TMCC &amp; DISSec, College of Computer Science, Nankai University, Tianjin, China","institution_ids":["https://openalex.org/I205237279"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Jinglei Shi","orcid":"https://orcid.org/0000-0003-2926-0415"},"institutions":[{"id":"https://openalex.org/I205237279","display_name":"Nankai University","ror":"https://ror.org/01y1kjr75","country_code":"CN","type":"education","lineage":["https://openalex.org/I205237279"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jinglei Shi","raw_affiliation_strings":["VCIP &amp; TMCC &amp; DISSec, College of Computer Science, Nankai University, Tianjin, China"],"affiliations":[{"raw_affiliation_string":"VCIP &amp; TMCC &amp; DISSec, College of Computer Science, Nankai University, Tianjin, China","institution_ids":["https://openalex.org/I205237279"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Teodor Boyadzhiev","orcid":"https://orcid.org/0000-0002-9554-2608"},"institutions":[{"id":"https://openalex.org/I24768866","display_name":"Bulgarian Academy of Sciences","ror":"https://ror.org/01x8hew03","country_code":"BG","type":"government","lineage":["https://openalex.org/I24768866"]},{"id":"https://openalex.org/I4210105926","display_name":"Institute of Mathematics and Informatics","ror":"https://ror.org/01b5dy719","country_code":"BG","type":"facility","lineage":["https://openalex.org/I24768866","https://openalex.org/I4210105926"]}],"countries":["BG"],"is_corresponding":false,"raw_author_name":"Teodor Boyadzhiev","raw_affiliation_strings":["Institute of Mathematics and Informatics, Bulgarian Academy of Sciences, Sofia, Bulgaria"],"affiliations":[{"raw_affiliation_string":"Institute of Mathematics and Informatics, Bulgarian Academy of Sciences, Sofia, Bulgaria","institution_ids":["https://openalex.org/I4210105926","https://openalex.org/I24768866"]}]},{"author_position":"last","author":{"id":null,"display_name":"Jufeng Yang","orcid":"https://orcid.org/0000-0003-0219-3443"},"institutions":[{"id":"https://openalex.org/I205237279","display_name":"Nankai University","ror":"https://ror.org/01y1kjr75","country_code":"CN","type":"education","lineage":["https://openalex.org/I205237279"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jufeng Yang","raw_affiliation_strings":["VCIP &amp; TMCC &amp; DISSec, College of Computer Science, Nankai University, Tianjin, China"],"affiliations":[{"raw_affiliation_string":"VCIP &amp; TMCC &amp; DISSec, College of Computer Science, Nankai University, Tianjin, China","institution_ids":["https://openalex.org/I205237279"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I205237279"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.54817644,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"27","issue":null,"first_page":"9670","last_page":"9685"},"is_retracted":false,"is_paratext":false,"is_xpac":true,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.8751000165939331,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.8751000165939331,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.03400000184774399,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.017999999225139618,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.6255000233650208},{"id":"https://openalex.org/keywords/spatial-contextual-awareness","display_name":"Spatial contextual awareness","score":0.5526999831199646},{"id":"https://openalex.org/keywords/image-segmentation","display_name":"Image segmentation","score":0.5432999730110168},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.5328999757766724},{"id":"https://openalex.org/keywords/decoding-methods","display_name":"Decoding methods","score":0.5181000232696533},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4943000078201294},{"id":"https://openalex.org/keywords/spatial-analysis","display_name":"Spatial analysis","score":0.4934999942779541},{"id":"https://openalex.org/keywords/pixel","display_name":"Pixel","score":0.4869999885559082},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.4693000018596649}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8514999747276306},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6819000244140625},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.6255000233650208},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.5849000215530396},{"id":"https://openalex.org/C64754055","wikidata":"https://www.wikidata.org/wiki/Q7574053","display_name":"Spatial contextual awareness","level":2,"score":0.5526999831199646},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.5432999730110168},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.5328999757766724},{"id":"https://openalex.org/C57273362","wikidata":"https://www.wikidata.org/wiki/Q576722","display_name":"Decoding methods","level":2,"score":0.5181000232696533},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4943000078201294},{"id":"https://openalex.org/C159620131","wikidata":"https://www.wikidata.org/wiki/Q1938983","display_name":"Spatial analysis","level":2,"score":0.4934999942779541},{"id":"https://openalex.org/C160633673","wikidata":"https://www.wikidata.org/wiki/Q355198","display_name":"Pixel","level":2,"score":0.4869999885559082},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.4693000018596649},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.4207000136375427},{"id":"https://openalex.org/C205203396","wikidata":"https://www.wikidata.org/wiki/Q612143","display_name":"Bilinear interpolation","level":2,"score":0.38530001044273376},{"id":"https://openalex.org/C141353440","wikidata":"https://www.wikidata.org/wiki/Q182221","display_name":"Fuse (electrical)","level":2,"score":0.3774000108242035},{"id":"https://openalex.org/C137800194","wikidata":"https://www.wikidata.org/wiki/Q11713455","display_name":"Interpolation (computer graphics)","level":3,"score":0.34369999170303345},{"id":"https://openalex.org/C53533937","wikidata":"https://www.wikidata.org/wiki/Q185020","display_name":"Histogram","level":3,"score":0.3116999864578247},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.31049999594688416},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.301800012588501},{"id":"https://openalex.org/C9417928","wikidata":"https://www.wikidata.org/wiki/Q1070689","display_name":"Image processing","level":3,"score":0.30160000920295715},{"id":"https://openalex.org/C183322885","wikidata":"https://www.wikidata.org/wiki/Q17007702","display_name":"Context model","level":3,"score":0.30090001225471497},{"id":"https://openalex.org/C75608658","wikidata":"https://www.wikidata.org/wiki/Q44395","display_name":"Pascal (unit)","level":2,"score":0.3003999888896942},{"id":"https://openalex.org/C179799912","wikidata":"https://www.wikidata.org/wiki/Q205084","display_name":"Computational complexity theory","level":2,"score":0.2892000079154968},{"id":"https://openalex.org/C65885262","wikidata":"https://www.wikidata.org/wiki/Q7429708","display_name":"Scale-space segmentation","level":4,"score":0.2831000089645386},{"id":"https://openalex.org/C63099799","wikidata":"https://www.wikidata.org/wiki/Q17147001","display_name":"Image texture","level":4,"score":0.28060001134872437},{"id":"https://openalex.org/C179518139","wikidata":"https://www.wikidata.org/wiki/Q5140297","display_name":"Coding (social sciences)","level":2,"score":0.27970001101493835},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.26269999146461487},{"id":"https://openalex.org/C151416825","wikidata":"https://www.wikidata.org/wiki/Q934791","display_name":"Quadtree","level":2,"score":0.2624000012874603},{"id":"https://openalex.org/C25694479","wikidata":"https://www.wikidata.org/wiki/Q7446278","display_name":"Segmentation-based object categorization","level":5,"score":0.25519999861717224}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tmm.2025.3618549","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2025.3618549","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Sustainable cities and communities","id":"https://metadata.un.org/sdg/11","score":0.8551862239837646}],"awards":[{"id":"https://openalex.org/G1168484581","display_name":null,"funder_award_id":"SCCI2023YB01","funder_id":"https://openalex.org/F4320321630","funder_display_name":"Dalian University of Technology"},{"id":"https://openalex.org/G4147463729","display_name":null,"funder_award_id":"62302240","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320321630","display_name":"Dalian University of Technology","ror":"https://ror.org/023hj5876"},{"id":"https://openalex.org/F4320335787","display_name":"Fundamental Research Funds for the Central Universities","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":49,"referenced_works":["https://openalex.org/W1677182931","https://openalex.org/W1913356549","https://openalex.org/W2037227137","https://openalex.org/W2117539524","https://openalex.org/W2194775991","https://openalex.org/W2340897893","https://openalex.org/W2476548250","https://openalex.org/W2762439315","https://openalex.org/W2886934227","https://openalex.org/W2887964057","https://openalex.org/W2921495890","https://openalex.org/W2954171777","https://openalex.org/W2963419596","https://openalex.org/W2963890956","https://openalex.org/W2971198903","https://openalex.org/W2999921958","https://openalex.org/W3088146056","https://openalex.org/W3109713717","https://openalex.org/W3112503277","https://openalex.org/W3114677757","https://openalex.org/W3158385340","https://openalex.org/W3169865585","https://openalex.org/W3172265425","https://openalex.org/W3190437803","https://openalex.org/W3194523157","https://openalex.org/W3194686611","https://openalex.org/W3196904463","https://openalex.org/W3197715576","https://openalex.org/W3199130398","https://openalex.org/W3209519737","https://openalex.org/W3215565096","https://openalex.org/W4210643638","https://openalex.org/W4282929256","https://openalex.org/W4285144577","https://openalex.org/W4287891172","https://openalex.org/W4289752563","https://openalex.org/W4312364648","https://openalex.org/W4312688875","https://openalex.org/W4321019952","https://openalex.org/W4322706642","https://openalex.org/W4386076267","https://openalex.org/W4386824854","https://openalex.org/W4388579656","https://openalex.org/W4390097199","https://openalex.org/W4390489106","https://openalex.org/W4392693659","https://openalex.org/W4393159321","https://openalex.org/W4402424158","https://openalex.org/W4402981688"],"related_works":[],"abstract_inverted_index":{"Striking":[0],"a":[1,8,22,77,149],"balance":[2],"between":[3],"speed":[4],"and":[5,43,106,124,136,156,178,184,195,210],"accuracy":[6],"re-mains":[7],"significant":[9],"challenge":[10],"in":[11,96,126],"real-time":[12],"semantic":[13],"segmentation.":[14],"Existing":[15],"methods":[16,34],"typically":[17],"employ":[18],"an":[19,57,144],"encoder-decoder":[20],"or":[21],"multibranch":[23],"structure":[24],"to":[25,165,198],"achieve":[26],"accurate":[27,127],"segmentation":[28,202],"while":[29],"maintaining":[30],"compactness.":[31],"However,":[32],"these":[33,53],"often":[35],"overlook":[36],"the":[37,72,97,101,133,158,167,180,200,207,215],"different":[38],"significance":[39],"of":[40,79,100,182,217],"various":[41],"pixels":[42],"suffer":[44],"from":[45],"insufficient":[46],"spatial":[47,73,89,122,128,139,183],"information":[48,114],"during":[49],"encoding.":[50],"To":[51,130],"address":[52],"challenges,":[54],"we":[55,67,142],"propose":[56],"Image":[58,159],"Complexity-aware":[59],"Two-branch":[60],"Network":[61],"(ICTNet)":[62],"with":[63,82,93],"enhanced":[64,117,145],"decoding.":[65],"Notably,":[66],"introduce":[68],"image":[69,83],"complexity":[70,84],"into":[71,175],"branch":[74,169],"by":[75],"supervising":[76],"partial":[78],"its":[80],"parameters":[81],"maps.":[85],"The":[86,111,171,187,220],"generated":[87],"complexity-aware":[88],"features":[90,95,123,135,174,189],"are":[91,190],"fused":[92,188],"context":[94,113,119,151,185],"intermediate":[98],"period":[99],"encoder":[102],"through":[103,193],"our":[104,218],"Spatial":[105],"Context":[107],"Fusion":[108],"(SCFusion)":[109],"module.":[110],"rich":[112],"can":[115],"provide":[116],"object":[118],"guidance":[120],"for":[121,153],"result":[125],"details.":[129],"fully":[131],"integrate":[132],"twobranch":[134],"recover":[137],"sufficient":[138],"detail":[140],"information,":[141],"design":[143],"decoder":[146],"which":[147],"integrates":[148],"multi-level":[150],"module":[152,164],"feature":[154],"restoration":[155],"develop":[157],"Complexity":[160],"Prior":[161],"Guiding":[162],"(ICPG)":[163],"fuse":[166],"two":[168],"features.":[170,186],"ICPG":[172],"transforms":[173],"attention":[176],"maps":[177],"modulates":[179],"summing":[181],"then":[191],"upsampled":[192],"PixelShuffle":[194],"bilinear":[196],"interpolation":[197],"produce":[199],"final":[201],"results.":[203],"Extensive":[204],"experiments":[205],"on":[206],"Cityscapes,":[208],"CamVid,":[209],"PASCAL":[211],"VOC2012":[212],"datasets":[213],"demonstrate":[214],"effectiveness":[216],"method.":[219],"code":[221],"is":[222],"available":[223],"at":[224],"https://github.com/dalexin/ICTNet.":[225]},"counts_by_year":[],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2025-10-10T00:00:00"}
