{"id":"https://openalex.org/W7133344780","doi":"https://doi.org/10.48550/arxiv.2603.01036","title":"SMR-Net:Robot Snap Detection Based on Multi-Scale Features and Self-Attention Network","display_name":"SMR-Net:Robot Snap Detection Based on Multi-Scale Features and Self-Attention Network","publication_year":2026,"publication_date":"2026-03-01","ids":{"openalex":"https://openalex.org/W7133344780","doi":"https://doi.org/10.48550/arxiv.2603.01036"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.01036","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.01036","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.01036","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5128002455","display_name":"Kuanxu Hou","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Hou, Kuanxu","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5128002455"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.6051999926567078,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.6051999926567078,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.16140000522136688,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12111","display_name":"Industrial Vision Systems and Defect Detection","score":0.0414000004529953,"subfield":{"id":"https://openalex.org/subfields/2209","display_name":"Industrial and Manufacturing Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.678600013256073},{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.5997999906539917},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.46880000829696655},{"id":"https://openalex.org/keywords/convolution","display_name":"Convolution (computer science)","score":0.4408999979496002},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4381999969482422},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.43709999322891235},{"id":"https://openalex.org/keywords/dimension","display_name":"Dimension (graph theory)","score":0.42410001158714294},{"id":"https://openalex.org/keywords/sensor-fusion","display_name":"Sensor fusion","score":0.41290000081062317},{"id":"https://openalex.org/keywords/unification","display_name":"Unification","score":0.40790000557899475}],"concepts":[{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.678600013256073},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6780999898910522},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.5997999906539917},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5440999865531921},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.46880000829696655},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4449999928474426},{"id":"https://openalex.org/C45347329","wikidata":"https://www.wikidata.org/wiki/Q5166604","display_name":"Convolution (computer science)","level":3,"score":0.4408999979496002},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4381999969482422},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.43709999322891235},{"id":"https://openalex.org/C33676613","wikidata":"https://www.wikidata.org/wiki/Q13415176","display_name":"Dimension (graph theory)","level":2,"score":0.42410001158714294},{"id":"https://openalex.org/C33954974","wikidata":"https://www.wikidata.org/wiki/Q486494","display_name":"Sensor fusion","level":2,"score":0.41290000081062317},{"id":"https://openalex.org/C96146094","wikidata":"https://www.wikidata.org/wiki/Q609057","display_name":"Unification","level":2,"score":0.40790000557899475},{"id":"https://openalex.org/C34736171","wikidata":"https://www.wikidata.org/wiki/Q918333","display_name":"Preprocessor","level":2,"score":0.38999998569488525},{"id":"https://openalex.org/C64543145","wikidata":"https://www.wikidata.org/wiki/Q162942","display_name":"Intersection (aeronautics)","level":2,"score":0.3743000030517578},{"id":"https://openalex.org/C774472","wikidata":"https://www.wikidata.org/wiki/Q6760393","display_name":"Margin (machine learning)","level":2,"score":0.36160001158714294},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.3580999970436096},{"id":"https://openalex.org/C2779997099","wikidata":"https://www.wikidata.org/wiki/Q7547253","display_name":"Snap","level":2,"score":0.328900009393692},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.3156999945640564},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.30070000886917114},{"id":"https://openalex.org/C158525013","wikidata":"https://www.wikidata.org/wiki/Q2593739","display_name":"Fusion","level":2,"score":0.28380000591278076},{"id":"https://openalex.org/C64876066","wikidata":"https://www.wikidata.org/wiki/Q5141226","display_name":"Cognitive neuroscience of visual object recognition","level":3,"score":0.27869999408721924},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.2786000072956085},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.26489999890327454},{"id":"https://openalex.org/C52102323","wikidata":"https://www.wikidata.org/wiki/Q1671968","display_name":"Pose","level":2,"score":0.2623000144958496},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.26190000772476196},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.2603999972343445},{"id":"https://openalex.org/C99862985","wikidata":"https://www.wikidata.org/wiki/Q10858068","display_name":"Production line","level":2,"score":0.2533999979496002}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.01036","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.01036","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.01036","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.01036","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"In":[0],"robot":[1],"automated":[2],"assembly,":[3],"snap":[4,18,99,149,186],"assembly":[5,25,51],"precision":[6],"and":[7,20,34,62,75,101,114,138,146,165,167,175,188],"efficiency":[8],"directly":[9],"determine":[10],"overall":[11],"production":[12],"quality.":[13],"As":[14],"a":[15,59],"core":[16],"prerequisite,":[17],"detection":[19,69,74,187],"localization":[21,36,76,189],"critically":[22],"affect":[23],"subsequent":[24],"success.":[26],"Traditional":[27],"visual":[28],"methods":[29],"suffer":[30],"from":[31],"poor":[32],"robustness":[33],"large":[35],"errors":[37],"when":[38],"handling":[39],"complex":[40,185],"scenarios":[41],"(e.g.,":[42],"transparent":[43],"or":[44],"low-contrast":[45],"snaps),":[46],"failing":[47],"to":[48,71,96,130],"meet":[49],"high-precision":[50],"demands.":[52],"To":[53],"address":[54],"this,":[55],"this":[56],"paper":[57],"designs":[58],"dedicated":[60],"sensor":[61,87],"proposes":[63],"SMR-Net,":[64],"an":[65,80,92,123],"self-attention-based":[66],"multi-scale":[67,82,105],"object":[68],"algorithm,":[70],"synergistically":[72],"enhance":[73],"performance.":[77],"SMR-Net":[78,152],"adopts":[79],"attention-enhanced":[81],"feature":[83,94,106],"fusion":[84],"architecture:":[85],"raw":[86],"data":[88],"is":[89],"encoded":[90],"via":[91],"attention-embedded":[93],"extractor":[95],"strengthen":[97],"key":[98],"features":[100],"suppress":[102],"noise;":[103],"three":[104],"maps":[107],"are":[108],"processed":[109],"in":[110,184],"parallel":[111],"with":[112],"standard":[113],"dilated":[115],"convolution":[116],"for":[117],"dimension":[118],"unification":[119],"while":[120],"preserving":[121],"resolution;":[122],"adaptive":[124],"reweighting":[125],"network":[126],"dynamically":[127],"assigns":[128],"weights":[129],"fused":[131],"features,":[132],"generating":[133],"fine":[134],"representations":[135],"integrating":[136],"details":[137],"global":[139],"semantics.":[140],"Experimental":[141],"results":[142],"on":[143],"Type":[144,147],"A":[145],"B":[148],"datasets":[150],"show":[151],"outperforms":[153],"traditional":[154],"Faster":[155],"R-CNN":[156],"significantly:":[157],"Intersection":[158],"over":[159],"Union":[160],"(IoU)":[161],"improves":[162],"by":[163,173],"6.52%":[164],"5.8%,":[166],"mean":[168],"Average":[169],"Precision":[170],"(mAP)":[171],"increases":[172],"2.8%":[174],"1.5%":[176],"respectively.":[177],"This":[178],"fully":[179],"demonstrates":[180],"the":[181],"method's":[182],"superiority":[183],"tasks.":[190]},"counts_by_year":[],"updated_date":"2026-03-04T07:09:34.246503","created_date":"2026-03-04T00:00:00"}
