{"id":"https://openalex.org/W4382400441","doi":"https://doi.org/10.1093/comjnl/bxad063","title":"Spatial-Aware Multi-Directional Autoencoder For Pre-Training","display_name":"Spatial-Aware Multi-Directional Autoencoder For Pre-Training","publication_year":2023,"publication_date":"2023-06-27","ids":{"openalex":"https://openalex.org/W4382400441","doi":"https://doi.org/10.1093/comjnl/bxad063"},"language":"en","primary_location":{"id":"doi:10.1093/comjnl/bxad063","is_oa":false,"landing_page_url":"https://doi.org/10.1093/comjnl/bxad063","pdf_url":null,"source":{"id":"https://openalex.org/S44643521","display_name":"The Computer Journal","issn_l":"0010-4620","issn":["0010-4620","1460-2067"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310311648","host_organization_name":"Oxford University Press","host_organization_lineage":["https://openalex.org/P4310311648","https://openalex.org/P4310311647"],"host_organization_lineage_names":["Oxford University Press","University of Oxford"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"The Computer Journal","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5102743275","display_name":"Weiwei Yang","orcid":"https://orcid.org/0000-0002-0377-2626"},"institutions":[{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"education","lineage":["https://openalex.org/I157773358"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Weiwei Yang","raw_affiliation_strings":["The School of Data and Computer Science, Sun Yat-sen University, Guangzhou; Guangdong Key Laboratory of Big Data Analysis and Processing , Guangzhou 510006 , P.R.China","The School of Data and Computer Science, Sun Yat-sen University, Guangzhou"],"affiliations":[{"raw_affiliation_string":"The School of Data and Computer Science, Sun Yat-sen University, Guangzhou; Guangdong Key Laboratory of Big Data Analysis and Processing , Guangzhou 510006 , P.R.China","institution_ids":["https://openalex.org/I157773358"]},{"raw_affiliation_string":"The School of Data and Computer Science, Sun Yat-sen University, Guangzhou","institution_ids":["https://openalex.org/I157773358"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5060335069","display_name":"Shangsong Liang","orcid":"https://orcid.org/0000-0003-1625-2168"},"institutions":[{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"education","lineage":["https://openalex.org/I157773358"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shangsong Liang","raw_affiliation_strings":["The School of Data and Computer Science, Sun Yat-sen University, Guangzhou; Guangdong Key Laboratory of Big Data Analysis and Processing , Guangzhou 510006 , P.R.China","The School of Data and Computer Science, Sun Yat-sen University, Guangzhou"],"affiliations":[{"raw_affiliation_string":"The School of Data and Computer Science, Sun Yat-sen University, Guangzhou; Guangdong Key Laboratory of Big Data Analysis and Processing , Guangzhou 510006 , P.R.China","institution_ids":["https://openalex.org/I157773358"]},{"raw_affiliation_string":"The School of Data and Computer Science, Sun Yat-sen University, Guangzhou","institution_ids":["https://openalex.org/I157773358"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5102961198","display_name":"Jian Yin","orcid":"https://orcid.org/0000-0002-4820-0226"},"institutions":[{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"education","lineage":["https://openalex.org/I157773358"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jian Yin","raw_affiliation_strings":["The School of Data and Computer Science, Sun Yat-sen University, Guangzhou; Guangdong Key Laboratory of Big Data Analysis and Processing , Guangzhou 510006 , P.R.China","The School of Data and Computer Science, Sun Yat-sen University, Guangzhou"],"affiliations":[{"raw_affiliation_string":"The School of Data and Computer Science, Sun Yat-sen University, Guangzhou; Guangdong Key Laboratory of Big Data Analysis and Processing , Guangzhou 510006 , P.R.China","institution_ids":["https://openalex.org/I157773358"]},{"raw_affiliation_string":"The School of Data and Computer Science, Sun Yat-sen University, Guangzhou","institution_ids":["https://openalex.org/I157773358"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5102743275"],"corresponding_institution_ids":["https://openalex.org/I157773358"],"apc_list":{"value":2635,"currency":"GBP","value_usd":3232},"apc_paid":null,"fwci":0.123,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.38805456,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":"67","issue":"4","first_page":"1346","last_page":"1360"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11775","display_name":"COVID-19 diagnosis using AI","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/2741","display_name":"Radiology, Nuclear Medicine and Imaging"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/autoencoder","display_name":"Autoencoder","score":0.9252339601516724},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.7948078513145447},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7853759527206421},{"id":"https://openalex.org/keywords/pixel","display_name":"Pixel","score":0.5869797468185425},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5775228142738342},{"id":"https://openalex.org/keywords/spatial-contextual-awareness","display_name":"Spatial contextual awareness","score":0.5539752244949341},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.5037748217582703},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.50240159034729},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.4646453559398651},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.44690555334091187},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.4264970123767853},{"id":"https://openalex.org/keywords/geography","display_name":"Geography","score":0.08414006233215332}],"concepts":[{"id":"https://openalex.org/C101738243","wikidata":"https://www.wikidata.org/wiki/Q786435","display_name":"Autoencoder","level":3,"score":0.9252339601516724},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7948078513145447},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7853759527206421},{"id":"https://openalex.org/C160633673","wikidata":"https://www.wikidata.org/wiki/Q355198","display_name":"Pixel","level":2,"score":0.5869797468185425},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5775228142738342},{"id":"https://openalex.org/C64754055","wikidata":"https://www.wikidata.org/wiki/Q7574053","display_name":"Spatial contextual awareness","level":2,"score":0.5539752244949341},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.5037748217582703},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.50240159034729},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.4646453559398651},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.44690555334091187},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.4264970123767853},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.08414006233215332},{"id":"https://openalex.org/C166957645","wikidata":"https://www.wikidata.org/wiki/Q23498","display_name":"Archaeology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1093/comjnl/bxad063","is_oa":false,"landing_page_url":"https://doi.org/10.1093/comjnl/bxad063","pdf_url":null,"source":{"id":"https://openalex.org/S44643521","display_name":"The Computer Journal","issn_l":"0010-4620","issn":["0010-4620","1460-2067"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310311648","host_organization_name":"Oxford University Press","host_organization_lineage":["https://openalex.org/P4310311648","https://openalex.org/P4310311647"],"host_organization_lineage_names":["Oxford University Press","University of Oxford"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"The Computer Journal","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1287980616","display_name":null,"funder_award_id":"U1811262","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2845204914","display_name":null,"funder_award_id":"U1811261","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2937404559","display_name":null,"funder_award_id":"U2001211","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G4015785278","display_name":null,"funder_award_id":"2019B1515130001","funder_id":"https://openalex.org/F4320337111","funder_display_name":"Basic and Applied Basic Research Foundation of Guangdong Province"},{"id":"https://openalex.org/G6840496190","display_name":null,"funder_award_id":"U1811264","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8057543385","display_name":null,"funder_award_id":"U1911203","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320337111","display_name":"Basic and Applied Basic Research Foundation of Guangdong Province","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":39,"referenced_works":["https://openalex.org/W967544008","https://openalex.org/W2507296351","https://openalex.org/W4221144677","https://openalex.org/W4382465386","https://openalex.org/W6638891565","https://openalex.org/W6639102338","https://openalex.org/W6676297131","https://openalex.org/W6700872662","https://openalex.org/W6720832695","https://openalex.org/W6729482032","https://openalex.org/W6735913928","https://openalex.org/W6736210646","https://openalex.org/W6743963275","https://openalex.org/W6746085279","https://openalex.org/W6748481559","https://openalex.org/W6753421600","https://openalex.org/W6760999690","https://openalex.org/W6763101540","https://openalex.org/W6765779288","https://openalex.org/W6768371451","https://openalex.org/W6769906684","https://openalex.org/W6770992763","https://openalex.org/W6775556278","https://openalex.org/W6779387320","https://openalex.org/W6779879114","https://openalex.org/W6780959388","https://openalex.org/W6784333009","https://openalex.org/W6786850268","https://openalex.org/W6786951733","https://openalex.org/W6787283782","https://openalex.org/W6787972765","https://openalex.org/W6788135285","https://openalex.org/W6788620109","https://openalex.org/W6790690058","https://openalex.org/W6792155083","https://openalex.org/W6792919013","https://openalex.org/W6794655914","https://openalex.org/W6796761347","https://openalex.org/W6803870738"],"related_works":["https://openalex.org/W2159052453","https://openalex.org/W3013693939","https://openalex.org/W2566616303","https://openalex.org/W3131327266","https://openalex.org/W4297051394","https://openalex.org/W2752972570","https://openalex.org/W2734887215","https://openalex.org/W2803255133","https://openalex.org/W2669956259","https://openalex.org/W4249005693"],"abstract_inverted_index":{"Abstract":[0],"Vision":[1],"Transformers":[2],"for":[3,12,36,78,87,97],"pre-trained":[4,38],"models":[5],"explore":[6,104],"semantic":[7,144],"context":[8],"and":[9,82,95,108,143],"spatial":[10,54],"relationships":[11],"images,":[13],"which":[14,91],"heavily":[15],"depend":[16],"on":[17,123],"how":[18],"you":[19],"select":[20],"image":[21,59,65,139,141],"patches.":[22],"In":[23],"this":[24],"paper,":[25],"we":[26],"propose":[27],"a":[28,37,57,63,73,83],"novel":[29],"Spatial-aware":[30,46],"Multi-directional":[31,47],"Patches":[32],"Multi-cycle":[33],"Autoencoder":[34],"(SMPMA)":[35],"model":[39,130],"that":[40,128],"brings":[41],"the":[42,79,88,136],"following":[43],"benefits:":[44],"(1)":[45],"(SM)":[48],"patches":[49,66,71,93,101,118],"are":[50],"created":[51],"with":[52],"multi-directional":[53],"locations,":[55],"transforming":[56],"whole":[58],"autoencoder":[60,67,75],"problem":[61],"into":[62],"short-span":[64],"problem;":[68],"(2)":[69],"SM":[70,100],"admit":[72],"self-cycle":[74],"alignment":[76],"learning":[77,86],"first":[80],"stage":[81],"cross-cycle":[84],"interaction":[85],"second":[89],"stage,":[90],"makes":[92],"align":[94],"interact":[96],"optimization;":[98],"(3)":[99],"enable":[102],"to":[103],"local":[105],"object":[106],"features":[107],"correlation":[109],"distribution":[110],"of":[111,138],"adjacent":[112],"pixels":[113],"by":[114],"taking":[115],"arbitrary":[116],"sampled":[117],"as":[119],"inputs.":[120],"Experimental":[121],"results":[122],"four":[124],"downstream":[125],"tasks":[126,137],"show":[127],"our":[129],"can":[131],"achieve":[132],"state-of-the-art":[133],"performance":[134],"over":[135],"generation,":[140],"classification":[142],"segmentation.":[145]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
