{"id":"https://openalex.org/W4413086908","doi":"https://doi.org/10.1142/s021800142554014x","title":"SRGAN-Based Input Enhancement and Attention-Guided YOLOv5s for Real-Time Excavator Pose Estimation","display_name":"SRGAN-Based Input Enhancement and Attention-Guided YOLOv5s for Real-Time Excavator Pose Estimation","publication_year":2025,"publication_date":"2025-07-17","ids":{"openalex":"https://openalex.org/W4413086908","doi":"https://doi.org/10.1142/s021800142554014x"},"language":"en","primary_location":{"id":"doi:10.1142/s021800142554014x","is_oa":false,"landing_page_url":"https://doi.org/10.1142/s021800142554014x","pdf_url":null,"source":{"id":"https://openalex.org/S41486457","display_name":"International Journal of Pattern Recognition and Artificial Intelligence","issn_l":"0218-0014","issn":["0218-0014","1793-6381"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319815","host_organization_name":"World Scientific","host_organization_lineage":["https://openalex.org/P4310319815"],"host_organization_lineage_names":["World Scientific"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Journal of Pattern Recognition and Artificial Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101864833","display_name":"Zeng Wang","orcid":null},"institutions":[{"id":"https://openalex.org/I137506752","display_name":"North China University of Science and Technology","ror":"https://ror.org/04z4wmb81","country_code":"CN","type":"education","lineage":["https://openalex.org/I137506752"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Wangting Zeng","raw_affiliation_strings":["College of Artificial Intelligence, North China University of Science and Technology, 21 Bohai Avenue, Caofeidian District, Tangshan 063210, Hebei, P.\u00a0R.\u00a0China"],"affiliations":[{"raw_affiliation_string":"College of Artificial Intelligence, North China University of Science and Technology, 21 Bohai Avenue, Caofeidian District, Tangshan 063210, Hebei, P.\u00a0R.\u00a0China","institution_ids":["https://openalex.org/I137506752"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5107903947","display_name":"Qiushi Huang","orcid":null},"institutions":[{"id":"https://openalex.org/I137506752","display_name":"North China University of Science and Technology","ror":"https://ror.org/04z4wmb81","country_code":"CN","type":"education","lineage":["https://openalex.org/I137506752"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qixiang Huang","raw_affiliation_strings":["College of Artificial Intelligence, North China University of Science and Technology, 21 Bohai Avenue, Caofeidian District, Tangshan 063210, Hebei, P.\u00a0R.\u00a0China"],"affiliations":[{"raw_affiliation_string":"College of Artificial Intelligence, North China University of Science and Technology, 21 Bohai Avenue, Caofeidian District, Tangshan 063210, Hebei, P.\u00a0R.\u00a0China","institution_ids":["https://openalex.org/I137506752"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5044063530","display_name":"Ke Wu","orcid":"https://orcid.org/0000-0001-5533-2772"},"institutions":[{"id":"https://openalex.org/I137506752","display_name":"North China University of Science and Technology","ror":"https://ror.org/04z4wmb81","country_code":"CN","type":"education","lineage":["https://openalex.org/I137506752"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ke Wu","raw_affiliation_strings":["College of Artificial Intelligence, North China University of Science and Technology, 21 Bohai Avenue, Caofeidian District, Tangshan 063210, Hebei, P.\u00a0R.\u00a0China"],"affiliations":[{"raw_affiliation_string":"College of Artificial Intelligence, North China University of Science and Technology, 21 Bohai Avenue, Caofeidian District, Tangshan 063210, Hebei, P.\u00a0R.\u00a0China","institution_ids":["https://openalex.org/I137506752"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100646178","display_name":"Xuedong Zhang","orcid":"https://orcid.org/0009-0001-3454-1273"},"institutions":[{"id":"https://openalex.org/I137506752","display_name":"North China University of Science and Technology","ror":"https://ror.org/04z4wmb81","country_code":"CN","type":"education","lineage":["https://openalex.org/I137506752"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xuedong Zhang","raw_affiliation_strings":["College of Artificial Intelligence, North China University of Science and Technology, 21 Bohai Avenue, Caofeidian District, Tangshan 063210, Hebei, P.\u00a0R.\u00a0China"],"affiliations":[{"raw_affiliation_string":"College of Artificial Intelligence, North China University of Science and Technology, 21 Bohai Avenue, Caofeidian District, Tangshan 063210, Hebei, P.\u00a0R.\u00a0China","institution_ids":["https://openalex.org/I137506752"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5102313055","display_name":"Bo Cui","orcid":null},"institutions":[{"id":"https://openalex.org/I4210115299","display_name":"TED University","ror":"https://ror.org/0285rh439","country_code":"TR","type":"education","lineage":["https://openalex.org/I4210115299"]},{"id":"https://openalex.org/I137506752","display_name":"North China University of Science and Technology","ror":"https://ror.org/04z4wmb81","country_code":"CN","type":"education","lineage":["https://openalex.org/I137506752"]}],"countries":["CN","TR"],"is_corresponding":false,"raw_author_name":"Bo Cui","raw_affiliation_strings":["Hebei Key Laboratory of Industrial Intelligent Perception, College of Artificial Intelligence, North China University of Science and Technology, 21 Bohai Avenue, Caofeidian District, Tangshan 063210, Hebei, P.\u00a0R.\u00a0China"],"affiliations":[{"raw_affiliation_string":"Hebei Key Laboratory of Industrial Intelligent Perception, College of Artificial Intelligence, North China University of Science and Technology, 21 Bohai Avenue, Caofeidian District, Tangshan 063210, Hebei, P.\u00a0R.\u00a0China","institution_ids":["https://openalex.org/I137506752","https://openalex.org/I4210115299"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5101864833"],"corresponding_institution_ids":["https://openalex.org/I137506752"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.29451689,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"39","issue":"13","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9771999716758728,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9771999716758728,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11398","display_name":"Hand Gesture Recognition Systems","score":0.9592000246047974,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11687","display_name":"Teleoperation and Haptic Systems","score":0.9373000264167786,"subfield":{"id":"https://openalex.org/subfields/2210","display_name":"Mechanical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/excavator","display_name":"Excavator","score":0.9003496170043945},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6960797905921936},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6959478259086609},{"id":"https://openalex.org/keywords/estimation","display_name":"Estimation","score":0.510723352432251},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.47597306966781616},{"id":"https://openalex.org/keywords/pose","display_name":"Pose","score":0.45061954855918884},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4067501425743103},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3391941785812378},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.12488600611686707}],"concepts":[{"id":"https://openalex.org/C141392084","wikidata":"https://www.wikidata.org/wiki/Q182661","display_name":"Excavator","level":2,"score":0.9003496170043945},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6960797905921936},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6959478259086609},{"id":"https://openalex.org/C96250715","wikidata":"https://www.wikidata.org/wiki/Q965330","display_name":"Estimation","level":2,"score":0.510723352432251},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.47597306966781616},{"id":"https://openalex.org/C52102323","wikidata":"https://www.wikidata.org/wiki/Q1671968","display_name":"Pose","level":2,"score":0.45061954855918884},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4067501425743103},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3391941785812378},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.12488600611686707},{"id":"https://openalex.org/C78519656","wikidata":"https://www.wikidata.org/wiki/Q101333","display_name":"Mechanical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1142/s021800142554014x","is_oa":false,"landing_page_url":"https://doi.org/10.1142/s021800142554014x","pdf_url":null,"source":{"id":"https://openalex.org/S41486457","display_name":"International Journal of Pattern Recognition and Artificial Intelligence","issn_l":"0218-0014","issn":["0218-0014","1793-6381"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319815","host_organization_name":"World Scientific","host_organization_lineage":["https://openalex.org/P4310319815"],"host_organization_lineage_names":["World Scientific"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Journal of Pattern Recognition and Artificial Intelligence","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":18,"referenced_works":["https://openalex.org/W2026782279","https://openalex.org/W2900055483","https://openalex.org/W2903099067","https://openalex.org/W2947223272","https://openalex.org/W2995932445","https://openalex.org/W3049455165","https://openalex.org/W3132694240","https://openalex.org/W3146366485","https://openalex.org/W3160412534","https://openalex.org/W3166023678","https://openalex.org/W3197793211","https://openalex.org/W4293094637","https://openalex.org/W4312349930","https://openalex.org/W4385710061","https://openalex.org/W4388362190","https://openalex.org/W4388672590","https://openalex.org/W4390883606","https://openalex.org/W4398756379"],"related_works":["https://openalex.org/W3003601017","https://openalex.org/W2038528908","https://openalex.org/W2997898942","https://openalex.org/W2997279469","https://openalex.org/W2901741596","https://openalex.org/W2363098002","https://openalex.org/W2347606691","https://openalex.org/W2391703932","https://openalex.org/W2370050348","https://openalex.org/W2353530107"],"abstract_inverted_index":{"The":[0,75,163],"measurement":[1,26],"of":[2,56,70,84,98,141,150,153,157],"excavator":[3,11,18,58,173],"pose":[4,19,25,37,60,63,174],"information":[5,64],"is":[6,65,78,104],"crucial":[7],"for":[8,87,117,172],"advancing":[9],"intelligent":[10],"control":[12],"systems.":[13],"To":[14],"address":[15],"challenges":[16],"in":[17,120,176],"detection":[20,55,113,139,175],"\u2014":[21,31],"such":[22],"as":[23,106],"small":[24,118],"targets":[27,119],"and":[28,115,155,167],"blurred":[29],"images":[30],"a":[32,138,145],"high-speed,":[33],"high-accuracy":[34],"visual":[35],"technology-based":[36],"recognition":[38],"algorithm,":[39,135],"super-resolution":[40],"input-YOLOv5s,":[41],"was":[42],"developed.":[43],"This":[44],"algorithm":[45],"includes":[46],"an":[47],"image":[48,73],"target":[49,72],"designed":[50],"specifically":[51],"to":[52,80,110],"facilitate":[53],"the":[54,57,68,71,82,95,99,107,112,133,160,170],"arm\u2019s":[59],"angles.":[61],"Excavator":[62],"derived":[66],"through":[67],"analysis":[69],"data.":[74],"SRGAN":[76],"model":[77],"used":[79],"enhance":[81],"quality":[83],"input":[85],"data":[86],"YOLOv5,":[88],"while":[89,124],"attention":[90],"mechanisms":[91],"are":[92],"introduced":[93],"at":[94],"terminal":[96],"stage":[97],"backbone":[100],"network.":[101],"Focal":[102],"loss":[103,108],"employed":[105],"function":[109],"improve":[111],"accuracy":[114],"stability":[116],"complex":[121],"construction":[122],"environments,":[123],"also":[125],"mitigating":[126],"class":[127],"imbalance.":[128],"Experimental":[129],"results":[130],"demonstrate":[131],"that":[132],"improved":[134],"SRI-YOLOv5s,":[136],"achieved":[137],"speed":[140],"59.20":[142],"FPS,":[143],"with":[144],"mean":[146],"average":[147],"precision":[148,152],"(mAP)":[149],"89.46%,":[151],"91.7%,":[154],"recall":[156],"92.1%,":[158],"outperforming":[159],"original":[161],"model.":[162],"model\u2019s":[164],"real-time":[165],"performance":[166],"robustness":[168],"meet":[169],"requirements":[171],"practical":[177],"environments.":[178]},"counts_by_year":[],"updated_date":"2025-12-28T23:10:05.387466","created_date":"2025-10-10T00:00:00"}
