{"id":"https://openalex.org/W4386737313","doi":"https://doi.org/10.1109/tim.2023.3315355","title":"YOLO-MSA: A Multiscale Stereoscopic Attention Network for Empty-Dish Recycling Robots","display_name":"YOLO-MSA: A Multiscale Stereoscopic Attention Network for Empty-Dish Recycling Robots","publication_year":2023,"publication_date":"2023-01-01","ids":{"openalex":"https://openalex.org/W4386737313","doi":"https://doi.org/10.1109/tim.2023.3315355"},"language":"en","primary_location":{"id":"doi:10.1109/tim.2023.3315355","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tim.2023.3315355","pdf_url":null,"source":{"id":"https://openalex.org/S10892749","display_name":"IEEE Transactions on Instrumentation and Measurement","issn_l":"0018-9456","issn":["0018-9456","1557-9662"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Instrumentation and Measurement","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5090899188","display_name":"Xuebin Yue","orcid":"https://orcid.org/0000-0002-4356-9243"},"institutions":[{"id":"https://openalex.org/I135768898","display_name":"Ritsumeikan University","ror":"https://ror.org/0197nmd03","country_code":"JP","type":"education","lineage":["https://openalex.org/I135768898","https://openalex.org/I4390039241"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Xuebin Yue","raw_affiliation_strings":["Research Organization of Science and Technology, Ritsumeikan University, Kusatsu, Japan"],"affiliations":[{"raw_affiliation_string":"Research Organization of Science and Technology, Ritsumeikan University, Kusatsu, Japan","institution_ids":["https://openalex.org/I135768898"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5076579498","display_name":"Lin Meng","orcid":"https://orcid.org/0000-0003-4351-6923"},"institutions":[{"id":"https://openalex.org/I135768898","display_name":"Ritsumeikan University","ror":"https://ror.org/0197nmd03","country_code":"JP","type":"education","lineage":["https://openalex.org/I135768898","https://openalex.org/I4390039241"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Lin Meng","raw_affiliation_strings":["College of Science and Engineering, Ritsumeikan University, Kusatsu, Japan"],"affiliations":[{"raw_affiliation_string":"College of Science and Engineering, Ritsumeikan University, Kusatsu, Japan","institution_ids":["https://openalex.org/I135768898"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5090899188"],"corresponding_institution_ids":["https://openalex.org/I135768898"],"apc_list":null,"apc_paid":null,"fwci":2.4597,"has_fulltext":false,"cited_by_count":20,"citation_normalized_percentile":{"value":0.91146959,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":"72","issue":null,"first_page":"1","last_page":"14"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9886000156402588,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9886000156402588,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12111","display_name":"Industrial Vision Systems and Defect Detection","score":0.9693999886512756,"subfield":{"id":"https://openalex.org/subfields/2209","display_name":"Industrial and Manufacturing Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11448","display_name":"Face recognition and analysis","score":0.9564999938011169,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6514137983322144},{"id":"https://openalex.org/keywords/stereoscopy","display_name":"Stereoscopy","score":0.5571416020393372},{"id":"https://openalex.org/keywords/scale","display_name":"Scale (ratio)","score":0.5047422647476196},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.4421626925468445},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.43696433305740356},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.4128498435020447},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.38477692008018494},{"id":"https://openalex.org/keywords/cartography","display_name":"Cartography","score":0.17513924837112427},{"id":"https://openalex.org/keywords/geography","display_name":"Geography","score":0.13666009902954102}],"concepts":[{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6514137983322144},{"id":"https://openalex.org/C126057942","wikidata":"https://www.wikidata.org/wiki/Q35158","display_name":"Stereoscopy","level":2,"score":0.5571416020393372},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.5047422647476196},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.4421626925468445},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.43696433305740356},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.4128498435020447},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.38477692008018494},{"id":"https://openalex.org/C58640448","wikidata":"https://www.wikidata.org/wiki/Q42515","display_name":"Cartography","level":1,"score":0.17513924837112427},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.13666009902954102},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tim.2023.3315355","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tim.2023.3315355","pdf_url":null,"source":{"id":"https://openalex.org/S10892749","display_name":"IEEE Transactions on Instrumentation and Measurement","issn_l":"0018-9456","issn":["0018-9456","1557-9662"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Instrumentation and Measurement","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/8","score":0.7300000190734863,"display_name":"Decent work and economic growth"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":47,"referenced_works":["https://openalex.org/W639708223","https://openalex.org/W1536680647","https://openalex.org/W2097117768","https://openalex.org/W2102605133","https://openalex.org/W2109255472","https://openalex.org/W2183341477","https://openalex.org/W2193145675","https://openalex.org/W2194775991","https://openalex.org/W2752782242","https://openalex.org/W2884585870","https://openalex.org/W2928165649","https://openalex.org/W2963125010","https://openalex.org/W2963351448","https://openalex.org/W2963446712","https://openalex.org/W2963857746","https://openalex.org/W3018757597","https://openalex.org/W3034552520","https://openalex.org/W3042011474","https://openalex.org/W3106250896","https://openalex.org/W3108705364","https://openalex.org/W3125311193","https://openalex.org/W3126855404","https://openalex.org/W3136838953","https://openalex.org/W3169834292","https://openalex.org/W3184439416","https://openalex.org/W4213350031","https://openalex.org/W4224325915","https://openalex.org/W4281790833","https://openalex.org/W4285176535","https://openalex.org/W4286111650","https://openalex.org/W4286306527","https://openalex.org/W4293584584","https://openalex.org/W4312443937","https://openalex.org/W4313495634","https://openalex.org/W4313549235","https://openalex.org/W4319865456","https://openalex.org/W4321016398","https://openalex.org/W4322747009","https://openalex.org/W4364320749","https://openalex.org/W4386076325","https://openalex.org/W6620707391","https://openalex.org/W6750227808","https://openalex.org/W6753412334","https://openalex.org/W6777046832","https://openalex.org/W6798838024","https://openalex.org/W6838547440","https://openalex.org/W6849884611"],"related_works":["https://openalex.org/W1536158975","https://openalex.org/W2393788985","https://openalex.org/W2157670837","https://openalex.org/W4377836769","https://openalex.org/W2374120702","https://openalex.org/W2631594184","https://openalex.org/W1983607852","https://openalex.org/W2072849536","https://openalex.org/W1531686125","https://openalex.org/W2322721455"],"abstract_inverted_index":{"As":[0],"the":[1,6,34,37,61,72,76,115,138,141,167,196,202,206,218,248],"global":[2],"population":[3],"ages":[4],"and":[5,91,178,237,243],"labor":[7,17,40],"force":[8],"shrinks,":[9],"using":[10],"Artificial":[11],"Intelligence":[12],"(AI)":[13],"technology":[14],"to":[15,52,97,128],"promote":[16],"productivity":[18],"growth":[19],"has":[20,31,151,179,221,244],"become":[21],"a":[22,45,67,79,85,92,119,164,222],"hot":[23],"topic.":[24],"The":[25],"emergence":[26],"of":[27,36,75,132,140,166,184,198,201,250],"Empty-Dish":[28,57,207,251],"Recycling":[29,58,208,252],"Robots":[30],"effectively":[32],"alleviated":[33],"impact":[35],"decline":[38],"in":[39,114,239],"productivity.":[41],"This":[42],"paper":[43],"proposes":[44],"Multi-scale":[46],"Stereoscopic":[47],"Attention":[48],"(MSA)":[49],"network":[50,77],"YOLO-MSA":[51,150,220,228],"detect":[53],"postprandial":[54,168,203,240],"dishes":[55],"for":[56,105,110,145,205,247],"Robots.":[59,253],"First,":[60],"standard":[62],"convolution":[63],"is":[64,103,126,171],"replaced":[65],"with":[66,87],"Res2Net":[68,86],"module,":[69,101],"which":[70,102,170,194],"improves":[71],"multi-scale":[73,107,111,146,231],"expressiveness":[74],"at":[78],"finer-grained":[80],"level.":[81],"Second,":[82],"we":[83],"adopt":[84],"different":[88,133],"dilation":[89],"rates":[90],"novel":[93],"stereoscopic":[94],"attention":[95],"mechanism":[96],"propose":[98],"an":[99,181],"MSA":[100,143],"used":[104],"coarse-grained":[106],"expression.":[108],"Thirdly,":[109],"feature":[112,130,147,232],"learning":[113],"dimensionality":[116],"reduction":[117],"process,":[118],"Dimension":[120],"Reduction":[121],"Spatial":[122],"Pyramid":[123],"Pooling":[124],"(DRSPP)":[125],"proposed":[127,142,219],"fuse":[129],"maps":[131],"scales.":[134],"Extensive":[135],"experiments":[136],"demonstrate":[137],"effectiveness":[139,236],"module":[144],"learning.":[148],"Furthermore,":[149],"achieved":[152,180],"98.47%":[153],"mean":[154],"Average":[155],"Precision":[156],"(":[157,189],"<italic":[158,190],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[159,191],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">mAP</i>":[160],")":[161],"on":[162,212],"Dish-21,":[163],"dataset":[165],"dishes,":[169],"much":[172],"higher":[173],"than":[174],"other":[175,213],"state-of-the-art":[176],"models,":[177],"inference":[182],"speed":[183],"33.93":[185],"frames":[186],"per":[187],"second":[188],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">FPS</i>":[192],"),":[193],"meets":[195],"needs":[197],"real-time":[199],"detection":[200],"dish":[204,241],"Robot.":[209],"Test":[210],"results":[211],"public":[214],"datasets":[215],"show":[216],"that":[217],"better":[223],"generalization":[224],"ability.":[225],"In":[226],"summary,":[227],"exhibits":[229],"satisfactory":[230],"expression":[233],"ability,":[234],"demonstrates":[235],"robustness":[238],"detection,":[242],"far-reaching":[245],"significance":[246],"development":[249]},"counts_by_year":[{"year":2025,"cited_by_count":5},{"year":2024,"cited_by_count":14},{"year":2023,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
