{"id":"https://openalex.org/W4404478955","doi":"https://doi.org/10.1145/3696952.3696984","title":"Fine-grained image recognition method based on enhanced multi-branch network","display_name":"Fine-grained image recognition method based on enhanced multi-branch network","publication_year":2024,"publication_date":"2024-11-18","ids":{"openalex":"https://openalex.org/W4404478955","doi":"https://doi.org/10.1145/3696952.3696984"},"language":"en","primary_location":{"id":"doi:10.1145/3696952.3696984","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3696952.3696984","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2024 9th International Conference on Intelligent Information Processing","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1145/3696952.3696984","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Ling Shen","orcid":"https://orcid.org/0009-0002-2613-8174"},"institutions":[{"id":"https://openalex.org/I14116566","display_name":"Wuhan Polytechnic University","ror":"https://ror.org/05w0e5j23","country_code":"CN","type":"education","lineage":["https://openalex.org/I14116566"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ling Shen","raw_affiliation_strings":["Wuhan City Polytechnic, Wuhan, Hubei, China"],"raw_orcid":"https://orcid.org/0009-0002-2613-8174","affiliations":[{"raw_affiliation_string":"Wuhan City Polytechnic, Wuhan, Hubei, China","institution_ids":["https://openalex.org/I14116566"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5111849188","display_name":"Shangkun Wang","orcid":"https://orcid.org/0009-0001-6296-189X"},"institutions":[{"id":"https://openalex.org/I4210130811","display_name":"Rajamangala University of Technology Tawan-ok","ror":"https://ror.org/03cvxzw02","country_code":"TH","type":"education","lineage":["https://openalex.org/I10245363","https://openalex.org/I4210130811"]}],"countries":["TH"],"is_corresponding":false,"raw_author_name":"Shougui Wang","raw_affiliation_strings":["Rajamangala University of Technology Tawan-Ok, Bangkok, Bangkok, Thailand"],"raw_orcid":"https://orcid.org/0009-0001-6296-189X","affiliations":[{"raw_affiliation_string":"Rajamangala University of Technology Tawan-Ok, Bangkok, Bangkok, Thailand","institution_ids":["https://openalex.org/I4210130811"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.3019928,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"233","last_page":"240"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13114","display_name":"Image Processing Techniques and Applications","score":0.9812999963760376,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T13114","display_name":"Image Processing Techniques and Applications","score":0.9812999963760376,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9782999753952026,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12549","display_name":"Image and Object Detection Techniques","score":0.977400004863739,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7645012140274048},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5565680861473083},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.5408945083618164},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.45401421189308167},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4360900819301605}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7645012140274048},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5565680861473083},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.5408945083618164},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.45401421189308167},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4360900819301605}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3696952.3696984","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3696952.3696984","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2024 9th International Conference on Intelligent Information Processing","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3696952.3696984","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3696952.3696984","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2024 9th International Conference on Intelligent Information Processing","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":14,"referenced_works":["https://openalex.org/W2104657103","https://openalex.org/W2737725206","https://openalex.org/W2807931652","https://openalex.org/W2891951760","https://openalex.org/W2963090248","https://openalex.org/W2964274719","https://openalex.org/W2997300818","https://openalex.org/W2997747012","https://openalex.org/W2998345525","https://openalex.org/W3034552520","https://openalex.org/W3034865111","https://openalex.org/W3081907075","https://openalex.org/W3126558081","https://openalex.org/W3175248300"],"related_works":["https://openalex.org/W2772917594","https://openalex.org/W2036807459","https://openalex.org/W2058170566","https://openalex.org/W2755342338","https://openalex.org/W2166024367","https://openalex.org/W3116076068","https://openalex.org/W2229312674","https://openalex.org/W2951359407","https://openalex.org/W2079911747","https://openalex.org/W1969923398"],"abstract_inverted_index":{"The":[0,62],"key":[1,17,32,45],"of":[2,18,40,43,53,92,109,114,133,149,166,181,190,209,227,292],"fine-grained":[3,19,80,158],"image":[4,81,118,135,159,265],"recognition":[5,63,69,160],"is":[6,23,65,71,173,199,236,243],"to":[7,24,28,55,156,175,201,218,245,262],"extract":[8],"distinguished":[9],"visual":[10,20],"features.":[11],"Relevant":[12],"research":[13],"shows":[14],"that":[15],"the":[16,31,36,41,51,68,85,90,102,126,134,137,147,168,182,186,191,195,203,216,220,224,228,231,239,247,251,274,290,293],"classification":[21],"task":[22],"use":[25,50],"effective":[26],"methods":[27,49],"accurately":[29],"identify":[30],"information":[33,46,91,130,180,271],"areas":[34],"in":[35,84,101,136,161,215,295],"image.":[37],"In":[38],"view":[39],"idea":[42,52],"finding":[44],"regions,":[47,111],"many":[48],"detection-location-classification":[54],"find":[56],"target":[57,183],"locations":[58],"and":[59,87,116,120,124,128,206,223,238,250],"complete":[60],"classification.":[61],"speed":[64],"improved,":[66],"but":[67],"effect":[70],"not":[72],"accurate":[73,178,269],"enough.":[74],"Multi-branch":[75],"structure":[76],"can":[77,88],"learn":[78,176],"more":[79,177,268],"region":[82],"features":[83],"network,":[86],"fuse":[89],"different":[93],"branches.":[94],"However,":[95],"there":[96],"are":[97,213],"still":[98],"some":[99],"problems":[100],"existing":[103],"methods,":[104],"such":[105],"as":[106,261],"inaccurate":[107],"capture":[108],"detail":[110,115],"incomplete":[112],"extraction":[113,131],"overall":[117,127],"information,":[119],"excessive":[121],"computation.":[122],"Re-optimize":[123],"enhance":[125],"partial":[129],"ability":[132,226],"multi-branch":[138,144],"network.":[139,229],"This":[140],"study":[141],"proposes":[142],"a":[143,207],"network":[145,275],"with":[146,170,267],"introduction":[148],"Efficient":[150],"Channel":[151],"Attention":[152],"(ECA)":[153],"module":[154,172,233],"[4]":[155],"realize":[157],"weak":[162],"supervised":[163],"scenes.":[164],"First":[165],"all,":[167],"sub-network":[169],"ECA":[171,192],"introduced":[174],"coordinate":[179],"object":[184],"through":[185],"channel":[187,217],"attention":[188],"mechanism":[189],"sub-network.":[193],"Then,":[194],"deep":[196],"hyperparametric":[197],"convolution":[198,211,221],"used":[200,214,244],"replace":[202],"traditional":[204],"convolution,":[205],"variety":[208],"two-dimensional":[210],"cores":[212],"improve":[219],"performance":[222],"learning":[225],"Finally,":[230],"AAPM":[232],"without":[234,272],"training":[235],"introduced,":[237],"improved":[240],"sliding":[241],"window":[242],"represent":[246],"activation":[248],"value":[249],"distance":[252],"intersection":[253],"over":[254],"union":[255],"(DIoU)":[256],"loss":[257],"function":[258],"[5],":[259],"so":[260],"obtain":[263],"multiple":[264,286],"components":[266],"local":[270],"increasing":[273],"complexity.":[276],"Through":[277],"experimental":[278],"comparison,":[279],"good":[280],"results":[281],"have":[282],"been":[283],"achieved":[284],"on":[285],"data":[287],"sets,":[288],"proving":[289],"effectiveness":[291],"method":[294],"this":[296],"paper.":[297]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
