{"id":"https://openalex.org/W4401210950","doi":"https://doi.org/10.1080/01691864.2024.2381812","title":"Co-scale cross-attentional transformer for rearrangement target detection","display_name":"Co-scale cross-attentional transformer for rearrangement target detection","publication_year":2024,"publication_date":"2024-08-01","ids":{"openalex":"https://openalex.org/W4401210950","doi":"https://doi.org/10.1080/01691864.2024.2381812"},"language":"en","primary_location":{"id":"doi:10.1080/01691864.2024.2381812","is_oa":false,"landing_page_url":"https://doi.org/10.1080/01691864.2024.2381812","pdf_url":null,"source":{"id":"https://openalex.org/S192584203","display_name":"Advanced Robotics","issn_l":"0169-1864","issn":["0169-1864","1568-5535"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320547","host_organization_name":"Taylor & Francis","host_organization_lineage":["https://openalex.org/P4310320547"],"host_organization_lineage_names":["Taylor & Francis"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Advanced Robotics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5102166385","display_name":"Haruka Matsuo","orcid":"https://orcid.org/0009-0003-5617-507X"},"institutions":[{"id":"https://openalex.org/I203951103","display_name":"Keio University","ror":"https://ror.org/02kn6nx58","country_code":"JP","type":"education","lineage":["https://openalex.org/I203951103"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Haruka Matsuo","raw_affiliation_strings":["Faculty of Science and Technology, Keio University, Yokohama, Kanagawa, Japan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Faculty of Science and Technology, Keio University, Yokohama, Kanagawa, Japan","institution_ids":["https://openalex.org/I203951103"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041072699","display_name":"Shintaro Ishikawa","orcid":"https://orcid.org/0000-0002-6763-5583"},"institutions":[{"id":"https://openalex.org/I203951103","display_name":"Keio University","ror":"https://ror.org/02kn6nx58","country_code":"JP","type":"education","lineage":["https://openalex.org/I203951103"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Shintaro Ishikawa","raw_affiliation_strings":["Faculty of Science and Technology, Keio University, Yokohama, Kanagawa, Japan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Faculty of Science and Technology, Keio University, Yokohama, Kanagawa, Japan","institution_ids":["https://openalex.org/I203951103"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5033744547","display_name":"Komei Sugiura","orcid":"https://orcid.org/0000-0002-0261-0510"},"institutions":[{"id":"https://openalex.org/I203951103","display_name":"Keio University","ror":"https://ror.org/02kn6nx58","country_code":"JP","type":"education","lineage":["https://openalex.org/I203951103"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Komei Sugiura","raw_affiliation_strings":["Faculty of Science and Technology, Keio University, Yokohama, Kanagawa, Japan"],"raw_orcid":"https://orcid.org/0000-0002-0261-0510","affiliations":[{"raw_affiliation_string":"Faculty of Science and Technology, Keio University, Yokohama, Kanagawa, Japan","institution_ids":["https://openalex.org/I203951103"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5102166385"],"corresponding_institution_ids":["https://openalex.org/I203951103"],"apc_list":null,"apc_paid":null,"fwci":0.2381,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.49953613,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":"38","issue":"18","first_page":"1277","last_page":"1286"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10191","display_name":"Robotics and Sensor-Based Localization","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6282548308372498},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6230570673942566},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.6029669642448425},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.5785704851150513},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.5262441039085388},{"id":"https://openalex.org/keywords/change-detection","display_name":"Change detection","score":0.45731493830680847},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.4258202314376831},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3691069781780243},{"id":"https://openalex.org/keywords/voltage","display_name":"Voltage","score":0.1521826684474945},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.1506597399711609}],"concepts":[{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6282548308372498},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6230570673942566},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.6029669642448425},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.5785704851150513},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.5262441039085388},{"id":"https://openalex.org/C203595873","wikidata":"https://www.wikidata.org/wiki/Q25389927","display_name":"Change detection","level":2,"score":0.45731493830680847},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.4258202314376831},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3691069781780243},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.1521826684474945},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.1506597399711609},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1080/01691864.2024.2381812","is_oa":false,"landing_page_url":"https://doi.org/10.1080/01691864.2024.2381812","pdf_url":null,"source":{"id":"https://openalex.org/S192584203","display_name":"Advanced Robotics","issn_l":"0169-1864","issn":["0169-1864","1568-5535"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320547","host_organization_name":"Taylor & Francis","host_organization_lineage":["https://openalex.org/P4310320547"],"host_organization_lineage_names":["Taylor & Francis"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Advanced Robotics","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G3385511879","display_name":null,"funder_award_id":"23K03478","funder_id":"https://openalex.org/F4320334764","funder_display_name":"Japan Society for the Promotion of Science"}],"funders":[{"id":"https://openalex.org/F4320321680","display_name":"New Energy and Industrial Technology Development Organization","ror":"https://ror.org/0055k7a87"},{"id":"https://openalex.org/F4320334764","display_name":"Japan Society for the Promotion of Science","ror":"https://ror.org/00hhkn466"},{"id":"https://openalex.org/F4320338247","display_name":"Moonshot Research and Development Program","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":29,"referenced_works":["https://openalex.org/W764651262","https://openalex.org/W2015241127","https://openalex.org/W2193945050","https://openalex.org/W2194775991","https://openalex.org/W2317688867","https://openalex.org/W2560311620","https://openalex.org/W2736647539","https://openalex.org/W2789688775","https://openalex.org/W2911966516","https://openalex.org/W2914666560","https://openalex.org/W2962914239","https://openalex.org/W3004423752","https://openalex.org/W3010257550","https://openalex.org/W3027201985","https://openalex.org/W3048064159","https://openalex.org/W3090836511","https://openalex.org/W3134460763","https://openalex.org/W3138516171","https://openalex.org/W3156855646","https://openalex.org/W3173760279","https://openalex.org/W3176330035","https://openalex.org/W3186032668","https://openalex.org/W3186239158","https://openalex.org/W3210193870","https://openalex.org/W4214709605","https://openalex.org/W4224932139","https://openalex.org/W4312549298","https://openalex.org/W4312696712","https://openalex.org/W4390874575"],"related_works":["https://openalex.org/W2568858292","https://openalex.org/W1515964938","https://openalex.org/W2389381914","https://openalex.org/W2376528221","https://openalex.org/W196800607","https://openalex.org/W4390516098","https://openalex.org/W2359428812","https://openalex.org/W3181296946","https://openalex.org/W2181948922","https://openalex.org/W2015705630"],"abstract_inverted_index":{"Rearranging":[0],"objects":[1,31,62,88,102],"(e.g.":[2],"vase,":[3],"door)":[4],"back":[5],"in":[6,73,98],"their":[7],"original":[8],"positions":[9],"is":[10,26],"one":[11],"of":[12,76,101,127,130,153],"the":[13,30,39,55,74,96,99,122,134,139,142,160,170,173],"most":[14,81],"fundamental":[15],"skills":[16],"for":[17,61,118],"domestic":[18],"service":[19],"robots":[20],"(DSRs).":[21],"In":[22,44,109],"rearrangement":[23],"tasks,":[24],"it":[25],"crucial":[27],"to":[28,34,38,86,94],"detect":[29,95],"that":[32,63,103,176],"need":[33],"be":[35,65,105],"rearranged":[36],"according":[37],"goal":[40,143,161],"and":[41,92,133,144,156,162,172,184],"current":[42,145,163],"states.":[43,146,164],"this":[45,110],"study,":[46,111],"we":[47,112],"focus":[48],"on":[49,169,182],"Rearrangement":[50],"Target":[51],"Detection":[52,79],"(RTD),":[53],"where":[54],"model":[56],"generates":[57],"a":[58,114,128,149],"change":[59,97,157],"mask":[60],"should":[64],"rearranged.":[66],"Although":[67],"many":[68],"studies":[69],"have":[70],"been":[71],"conducted":[72],"field":[75],"Scene":[77],"Change":[78],"(SCD),":[80],"SCD":[82],"methods":[83,181],"often":[84],"fail":[85,93],"segment":[87],"with":[89],"complex":[90],"shapes":[91],"angle":[100],"can":[104],"opened":[106],"or":[107],"closed.":[108],"propose":[113],"Co-Scale":[115],"Cross-Attentional":[116,135],"Transformer":[117],"RTD.":[119],"We":[120,147,165],"introduce":[121],"Serial":[123],"Encoder":[124,136],"which":[125,137],"consists":[126],"sequence":[129],"serial":[131],"blocks":[132],"models":[138],"relationship":[140],"between":[141],"built":[148],"new":[150],"dataset":[151,171],"consisting":[152],"RGB":[154],"images":[155],"masks":[158],"regarding":[159],"validated":[166],"our":[167,177],"method":[168,178],"results":[174],"demonstrated":[175],"outperformed":[179],"baseline":[180],"F1-score":[183],"mean":[185],"IoU.":[186]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2025-12-10T02:45:41.426853","created_date":"2025-10-10T00:00:00"}
