{"id":"https://openalex.org/W4396523499","doi":"https://doi.org/10.1109/access.2024.3395541","title":"Research on Image Semantic Segmentation Based on Hybrid Cascade Feature Fusion and Detailed Attention Mechanism","display_name":"Research on Image Semantic Segmentation Based on Hybrid Cascade Feature Fusion and Detailed Attention Mechanism","publication_year":2024,"publication_date":"2024-01-01","ids":{"openalex":"https://openalex.org/W4396523499","doi":"https://doi.org/10.1109/access.2024.3395541"},"language":"en","primary_location":{"id":"doi:10.1109/access.2024.3395541","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2024.3395541","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/6514899/10510434.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://ieeexplore.ieee.org/ielx7/6287639/6514899/10510434.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5009376283","display_name":"Zhongkui Du","orcid":"https://orcid.org/0009-0003-1506-0276"},"institutions":[{"id":"https://openalex.org/I41208885","display_name":"Harbin University of Commerce","ror":"https://ror.org/03zsxkw25","country_code":"CN","type":"education","lineage":["https://openalex.org/I41208885"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zuoqiang Du","raw_affiliation_strings":["School of Computer and Information Engineering, Harbin University of Commerce, Harbin, China"],"affiliations":[{"raw_affiliation_string":"School of Computer and Information Engineering, Harbin University of Commerce, Harbin, China","institution_ids":["https://openalex.org/I41208885"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100390967","display_name":"Yuan Liang","orcid":"https://orcid.org/0009-0005-1426-2022"},"institutions":[{"id":"https://openalex.org/I4210144143","display_name":"Inspur (China)","ror":"https://ror.org/0474p4r72","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210144143"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuan Liang","raw_affiliation_strings":["Jinan Inspur Data Technology Company Ltd., Jinan, China"],"affiliations":[{"raw_affiliation_string":"Jinan Inspur Data Technology Company Ltd., Jinan, China","institution_ids":["https://openalex.org/I4210144143"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5009376283"],"corresponding_institution_ids":["https://openalex.org/I41208885"],"apc_list":{"value":1850,"currency":"USD","value_usd":1850},"apc_paid":{"value":1850,"currency":"USD","value_usd":1850},"fwci":2.1053,"has_fulltext":false,"cited_by_count":8,"citation_normalized_percentile":{"value":0.87953713,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":99},"biblio":{"volume":"12","issue":null,"first_page":"62365","last_page":"62377"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9761999845504761,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9689000248908997,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7908229827880859},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.7742748260498047},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.6440854072570801},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.6373059153556824},{"id":"https://openalex.org/keywords/image-segmentation","display_name":"Image segmentation","score":0.5920618772506714},{"id":"https://openalex.org/keywords/scale-space-segmentation","display_name":"Scale-space segmentation","score":0.5201299786567688},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5196484327316284},{"id":"https://openalex.org/keywords/pyramid","display_name":"Pyramid (geometry)","score":0.506117045879364},{"id":"https://openalex.org/keywords/pooling","display_name":"Pooling","score":0.5046447515487671},{"id":"https://openalex.org/keywords/segmentation-based-object-categorization","display_name":"Segmentation-based object categorization","score":0.503980815410614},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.4868170917034149},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.45326468348503113},{"id":"https://openalex.org/keywords/fusion-mechanism","display_name":"Fusion mechanism","score":0.44035035371780396},{"id":"https://openalex.org/keywords/fusion","display_name":"Fusion","score":0.12852105498313904},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.08906272053718567}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7908229827880859},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7742748260498047},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.6440854072570801},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.6373059153556824},{"id":"https://openalex.org/C124504099","wikidata":"https://www.wikidata.org/wiki/Q56933","display_name":"Image segmentation","level":3,"score":0.5920618772506714},{"id":"https://openalex.org/C65885262","wikidata":"https://www.wikidata.org/wiki/Q7429708","display_name":"Scale-space segmentation","level":4,"score":0.5201299786567688},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5196484327316284},{"id":"https://openalex.org/C142575187","wikidata":"https://www.wikidata.org/wiki/Q3358290","display_name":"Pyramid (geometry)","level":2,"score":0.506117045879364},{"id":"https://openalex.org/C70437156","wikidata":"https://www.wikidata.org/wiki/Q7228652","display_name":"Pooling","level":2,"score":0.5046447515487671},{"id":"https://openalex.org/C25694479","wikidata":"https://www.wikidata.org/wiki/Q7446278","display_name":"Segmentation-based object categorization","level":5,"score":0.503980815410614},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.4868170917034149},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.45326468348503113},{"id":"https://openalex.org/C173414695","wikidata":"https://www.wikidata.org/wiki/Q5510276","display_name":"Fusion mechanism","level":4,"score":0.44035035371780396},{"id":"https://openalex.org/C158525013","wikidata":"https://www.wikidata.org/wiki/Q2593739","display_name":"Fusion","level":2,"score":0.12852105498313904},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.08906272053718567},{"id":"https://openalex.org/C103038307","wikidata":"https://www.wikidata.org/wiki/Q6556360","display_name":"Lipid bilayer fusion","level":3,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/access.2024.3395541","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2024.3395541","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/6514899/10510434.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:5d7738f77d81475ea83ab6db0723ab21","is_oa":true,"landing_page_url":"https://doaj.org/article/5d7738f77d81475ea83ab6db0723ab21","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"IEEE Access, Vol 12, Pp 62365-62377 (2024)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.1109/access.2024.3395541","is_oa":true,"landing_page_url":"https://doi.org/10.1109/access.2024.3395541","pdf_url":"https://ieeexplore.ieee.org/ielx7/6287639/6514899/10510434.pdf","source":{"id":"https://openalex.org/S2485537415","display_name":"IEEE Access","issn_l":"2169-3536","issn":["2169-3536"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Access","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G3601016450","display_name":null,"funder_award_id":"UNPYSCT-2020212","funder_id":"https://openalex.org/F4320327728","funder_display_name":"University Nursing Program for Young Scholar with Creative Talents in Heilongjiang Province"},{"id":"https://openalex.org/G589937780","display_name":null,"funder_award_id":"606750192","funder_id":"https://openalex.org/F4320323085","funder_display_name":"Natural Science Foundation of Heilongjiang Province"}],"funders":[{"id":"https://openalex.org/F4320323085","display_name":"Natural Science Foundation of Heilongjiang Province","ror":null},{"id":"https://openalex.org/F4320327728","display_name":"University Nursing Program for Young Scholar with Creative Talents in Heilongjiang Province","ror":null}],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4396523499.pdf"},"referenced_works_count":32,"referenced_works":["https://openalex.org/W1901129140","https://openalex.org/W1903029394","https://openalex.org/W2412782625","https://openalex.org/W2560023338","https://openalex.org/W2563705555","https://openalex.org/W2630837129","https://openalex.org/W2940791683","https://openalex.org/W2954300568","https://openalex.org/W2963136578","https://openalex.org/W2972546487","https://openalex.org/W2986118726","https://openalex.org/W2991471181","https://openalex.org/W3132467470","https://openalex.org/W3134896931","https://openalex.org/W3136715451","https://openalex.org/W3154623612","https://openalex.org/W3166513127","https://openalex.org/W3200184518","https://openalex.org/W3201009223","https://openalex.org/W3209745495","https://openalex.org/W3211512919","https://openalex.org/W4210485727","https://openalex.org/W4221015298","https://openalex.org/W4225935108","https://openalex.org/W4312746086","https://openalex.org/W4320026650","https://openalex.org/W4379385793","https://openalex.org/W4379470079","https://openalex.org/W6684191040","https://openalex.org/W6739696289","https://openalex.org/W6775064670","https://openalex.org/W6779932004"],"related_works":["https://openalex.org/W2022849497","https://openalex.org/W3081299480","https://openalex.org/W2407190427","https://openalex.org/W2919210741","https://openalex.org/W2907584218","https://openalex.org/W3002446410","https://openalex.org/W4390224712","https://openalex.org/W4322096758","https://openalex.org/W3144569342","https://openalex.org/W2185902295"],"abstract_inverted_index":{"In":[0],"view":[1],"of":[2,13,42,50,63,114,139,232],"the":[3,40,44,47,61,66,69,88,111,115,119,122,135,140,146,152,184,193,201,209,229,233],"low":[4],"segmentation":[5,12,18,30,48,76,160,166],"accuracy":[6,49,231],"for":[7,16],"small-scale":[8,51],"object":[9,52,67],"and":[10,36,53,58,82,87,91,121,142,155,163,171,189,214,222,225],"insufficient":[11],"local":[14,54],"boundary":[15,55],"semantic":[17,29,75,100,137,159,165],"methods":[19,94],"based":[20,32,78,168],"on":[21,33,79,169,208],"Deep":[22],"Learning,":[23],"this":[24,237],"paper":[25,238],"proposes":[26],"an":[27,73],"image":[28,74,158,164],"approach":[31,106,234],"attention":[34,147,172,177,182,195],"mechanism":[35,148,196],"feature":[37,83,156,187],"fusion.":[38],"On":[39],"basis":[41],"ensuring":[43],"overall":[45,230],"accuracy,":[46],"is":[56,85,107,149,174,178,197,239],"improved,":[57],"it":[59,226],"meets":[60],"requirement":[62],"accurately":[64],"segmenting":[65],"in":[68,118,192,236],"complex":[70],"background.":[71],"Firstly,":[72],"model":[77,167],"hybrid":[80,89,153],"cascade":[81,154],"fusion":[84,105,157],"proposed,":[86],"concatenation":[90],"multi-cores":[92],"pooling":[93],"are":[95],"used":[96,198],"to":[97,109,132,180,199],"extract":[98],"deeper":[99],"information.":[101],"Then,":[102],"a":[103],"cross-stages":[104,170],"designed":[108],"divide":[110],"backbone":[112],"network":[113,120,161],"encoder":[116],"stage":[117],"improved":[123],"Atrous":[124],"Spatial":[125],"Pyramid":[126],"Pooling":[127],"module":[128],"into":[129,151],"three":[130],"stages":[131],"fully":[133],"utilize":[134],"different":[136],"information":[138],"shallow":[141],"deep":[143],"layers.":[144],"Thirdly,":[145],"introduced":[150],"model,":[162],"mechanisms":[173],"explained.":[175],"Self":[176],"added":[179],"channel":[181],"enhances":[183],"connection":[185],"between":[186],"maps,":[188],"one-dimensional":[190],"convolution":[191],"spatial":[194,202],"increase":[200],"receptive":[203],"field.":[204],"The":[205],"final":[206],"results":[207],"public":[210],"dataset":[211],"PASCAL":[212],"VOC2012":[213],"SUIM":[215],"show":[216],"that":[217,228],"MIoUs":[218],"have":[219],"reached":[220],"86.68%":[221],"61.55%":[223],"respectively,":[224],"proved":[227],"proposed":[235],"higher":[240],"than":[241],"other":[242],"ones.":[243]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":4},{"year":2024,"cited_by_count":3}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
